{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 设置driver"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-1-8ae4025e7ff4>:19: DeprecationWarning: use options instead of chrome_options\n",
      "  driver = webdriver.Chrome( chrome_options = opts) #desired_capabilities=caps,\n"
     ]
    }
   ],
   "source": [
    "from selenium import webdriver\n",
    "from selenium.webdriver.common.by import By\n",
    "from selenium.webdriver.common.desired_capabilities import DesiredCapabilities\n",
    "\n",
    "\n",
    "# Page-load strategy override, kept disabled for reference:\n",
    "#caps=dict()\n",
    "#caps[\"pageLoadStrategy\"] = \"none\"   # Do not wait for full page load\n",
    "\n",
    "opts = webdriver.ChromeOptions()\n",
    "opts.add_argument('--no-sandbox')  # works around the \"DevToolsActivePort file doesn't exist\" startup error\n",
    "opts.add_argument('--window-size=1920,3000')  # browser window size; Chrome expects WIDTH,HEIGHT separated by a comma\n",
    "opts.add_argument('--disable-gpu')  # Google's documentation suggests this flag to avoid a bug\n",
    "opts.add_argument('--hide-scrollbars')  # hide scrollbars, which helps on some special pages\n",
    "#opts.add_argument('blink-settings=imagesEnabled=false')  # skip loading images to speed things up\n",
    "#opts.add_argument('--headless')  # run without a visible window; on Linux without a display, startup fails unless this is enabled\n",
    "# opts.binary_location = \"C:\\portable\\PortableApps\\IronPortable\\App\\Iron\\chrome.exe\"\n",
    "# opts.binary_location = \"C:\\Program Files\\Google\\Chrome\\Application\\chromedriver.exe\" #\"H:\\_coding_\\Gitee\\InternetNewMedia\\CapstonePrj2016\\chromedriver.exe\"\n",
    "\n",
    "# `options` is the supported keyword; `chrome_options` is deprecated and emits a DeprecationWarning.\n",
    "driver = webdriver.Chrome(options=opts)  # desired_capabilities=caps is left disabled"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 打开CNKI\n",
    "* 1.校园网，自动登录\n",
    "* 2.校外网，需要使用校外登录"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load the CNKI home page in the browser session created above.\n",
    "driver.get('https://cnki.net')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 检查是否是中山大学南方学院登录"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "''"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the login display name so the institutional login can be checked\n",
    "# (presumably empty when no institution is logged in -- confirm).\n",
    "# find_element(By.ID, ...) replaces find_element_by_id, which was removed in Selenium 4.3.\n",
    "driver.find_element(By.ID, 'Ecp_loginShowName1').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 打开高级检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the advanced-search entry on the home page.\n",
    "# The previous mid-cell get_attribute('innerHTML') call was dropped: its result was discarded.\n",
    "element = driver.find_element(By.ID, 'highSearch')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 检查窗口\n",
    "* 只要是多个窗口，请检查窗口信息\n",
    "* 窗口信息按照窗口加载的顺序以列表存储，每一个窗口都有唯一识别的窗口ID"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'CDwindow-1B758225005A24641C60453EB64C9E1A'"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Handle of the window the driver is currently focused on\n",
    "driver.current_window_handle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-1B758225005A24641C60453EB64C9E1A',\n",
       " 'CDwindow-1733F1EB275C115FE0876C7CDA5C1CB6']"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Handles of every window currently open in this session\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-8-704fdf3805c1>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# Switch focus to the second window handle (index 1).\n",
    "# driver.switch_to.window replaces the deprecated driver.switch_to_window.\n",
    "driver.switch_to.window(driver.window_handles[1])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 点击学术期刊（分类可自选）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Select the '学术期刊' (academic journals) entry in the document-type menu.\n",
    "# The discarded get_attribute('innerHTML') call was removed.\n",
    "element = driver.find_element(By.XPATH, '//ul[@class=\"doctype-menus keji\"]/li[@data-id=\"xsqk\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 点击专业检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Open the '专业检索' (professional search) tab.\n",
    "# NOTE(review): this absolute XPath is tied to the current page layout and will break if the DOM changes.\n",
    "element = driver.find_element(By.XPATH, '/html/body/div[2]/div/div[2]/ul/li[4]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 勾选来源类别（EI、北大核心、CSSCI、SCI、CSCD）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the source-category input whose key is \"EI\".\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"EI\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Peking University core journals (北大核心)\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"HX\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the source-category input whose key is \"CSI\" (presumably CSSCI -- confirm against the page).\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"CSI\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the source-category input whose key is \"SI\" (presumably SCI -- confirm against the page).\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"SI\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the source-category input whose key is \"CSD\" (presumably CSCD -- confirm against the page).\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"CSD\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 设置搜索query"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Search expression typed into the professional-search box. A more elaborate example:\n",
    "# query = 'SU = \"新媒体\" AND (TI = \"人工智能\" OR TI = \"大数据\" OR TI = \"big data\")'\n",
    "query = 'SU=\"大数据\"'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# Replace the contents of the first <textarea> on the page with the query expression.\n",
    "element = driver.find_element(By.XPATH, '//textarea')\n",
    "element.clear()\n",
    "element.send_keys(query)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the '检索' (search) button to submit the query.\n",
    "element = driver.find_element(By.XPATH, '//input[@value=\"检索\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 检查检索信息，更换页面文章数量"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'共找到<em>26,650</em>条结果'"
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the raw innerHTML of the pager title, which reports the total number of hits.\n",
    "element = driver.find_element(By.XPATH, '//span[@class=\"pagerTitleCell\"]')\n",
    "element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the sort icon (presumably this opens the per-page dropdown used by the next cell -- confirm).\n",
    "element = driver.find_element(By.XPATH, '//i[@class=\"icon icon-sort\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Pick the entry with data-val=\"50\" in the per-page menu, i.e. 50 results per page.\n",
    "element = driver.find_element(By.XPATH, '//div[@id=\"perPageDiv\"]//li[@data-val=\"50\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 抓取页面信息"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>智能化测绘的基本问题与发展方向  网络首发</td>\n",
       "      <td>陈军; 刘万增; 武昊; Songnian Li; 闫利</td>\n",
       "      <td>测绘学报</td>\n",
       "      <td>2021-07-06 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>国土空间开发适宜性评价的理论、方法与技术应用  网络首发</td>\n",
       "      <td>刘小波;王玉宽;李明</td>\n",
       "      <td>地球信息科学学报</td>\n",
       "      <td>2021-07-06 15:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发</td>\n",
       "      <td>李燕云;王永明;周奇;李亦学;王振</td>\n",
       "      <td>复旦学报(医学版)</td>\n",
       "      <td>2021-07-06 15:53</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>铁路盾构隧道智能建造技术现状与展望  网络首发</td>\n",
       "      <td>陈丹; 刘喆; 刘建友; 房倩; 海路</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-07-06 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发</td>\n",
       "      <td>郑翔; 山茂峰</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-06 15:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>互联网旅游统计体系初探  网络首发</td>\n",
       "      <td>刘冰洁; 李倩; 赵彦云</td>\n",
       "      <td>统计与决策</td>\n",
       "      <td>2021-07-05 17:36</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>基于处方序列与处方序列对称分析的中药药物警戒  网络首发</td>\n",
       "      <td>吕健; 王连心; 谢雁鸣</td>\n",
       "      <td>中国中药杂志</td>\n",
       "      <td>2021-07-05 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>大数据金融：小微企业金融服务的创新与思考  网络首发</td>\n",
       "      <td>丁廉业</td>\n",
       "      <td>西南金融</td>\n",
       "      <td>2021-07-05 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>我国非银行支付适应性监管：基于鼓励金融创新、公平市场竞争与消费者保护的视角  网络首发</td>\n",
       "      <td>陈游</td>\n",
       "      <td>西南金融</td>\n",
       "      <td>2021-07-05 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>三支决策在工业大数据中的应用  网络首发</td>\n",
       "      <td>于洪; 杨雪梅</td>\n",
       "      <td>西北大学学报(自然科学版)</td>\n",
       "      <td>2021-07-05 14:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>大数据能力、服务链整合与政府智慧服务绩效关系研究  网络首发</td>\n",
       "      <td>张艾荣; 吕娜</td>\n",
       "      <td>软科学</td>\n",
       "      <td>2021-07-05 13:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据时代中国共产党的形象建构：挑战与应对  网络首发</td>\n",
       "      <td>苏玉波; 刘婷婷</td>\n",
       "      <td>西安交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-05 13:37</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>电子信息领域硕士研究生工程伦理课程建设  网络首发</td>\n",
       "      <td>周林娜; 常俊林; 代伟; 杨春雨</td>\n",
       "      <td>控制工程</td>\n",
       "      <td>2021-07-05 13:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>中国经济发展规律与理论研究关键科学问题  网络首发</td>\n",
       "      <td>刘元春; 任之光; 陈彦斌; 杨列勋; 刘作仪</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-05 11:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>中国科技情报事业回顾与展望：基于情报学理论的视角  网络首发</td>\n",
       "      <td>王琳; 赖茂生</td>\n",
       "      <td>中国图书馆学报</td>\n",
       "      <td>2021-07-05 11:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>基于地理大数据的省域休闲农业空间格局及其影响因素研究——以浙江省为例  网络首发</td>\n",
       "      <td>叶晗;吴博文;许红卫;干牧野;张晶</td>\n",
       "      <td>浙江农业学报</td>\n",
       "      <td>2021-07-05 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>基于靶向最大似然估计模型在高血压药物疗效评价中的应用</td>\n",
       "      <td>潘凤鸣;赵红玉;吴新莹;冯一平;侯庆振</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 09:15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例  网络首发</td>\n",
       "      <td>丁雄;蒋蔚;蒋静;胡跃华;武英</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 08:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例</td>\n",
       "      <td>丁雄;蒋蔚;蒋静;胡跃华;武英</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 08:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>计算机技术在储能系统中的应用研究</td>\n",
       "      <td>李骏; 杨雅志</td>\n",
       "      <td>储能科学与技术</td>\n",
       "      <td>2021-07-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>面向代码相似性检测的相似哈希改进方法</td>\n",
       "      <td>李玫;高庆;马森;张世琨;胡文蕙</td>\n",
       "      <td>软件学报</td>\n",
       "      <td>2021-07-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>国际大洋钻探科学数据的现状、特征及其汇编的科学意义  网络首发</td>\n",
       "      <td>马鹏飞;刘志飞;拓守廷;蒋璟鑫;许艺炜</td>\n",
       "      <td>地球科学进展</td>\n",
       "      <td>2021-07-02 15:58</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据背景下档案信息服务体系构建方法探析</td>\n",
       "      <td>孔媛媛; 张舒; 王爱</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 09:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>数据赋能教育治理创新:内涵、机制与实践</td>\n",
       "      <td>张培; 夏海鹰</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>社交媒体大数据的教育应用研究:价值、路径与挑战</td>\n",
       "      <td>李彤彤; 李坦; 郭栩宁</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>大数据时代的科学实在论发展趋向及其特征</td>\n",
       "      <td>刘伟伟</td>\n",
       "      <td>自然辩证法通讯</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>健康医疗大数据公平问题研究</td>\n",
       "      <td>李晓洁; 丛亚丽</td>\n",
       "      <td>自然辩证法通讯</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>智能财务人才培养与浙江大学的探索  网络首发</td>\n",
       "      <td>陈俊; 董望</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 15:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>互联网平台滥用市场支配地位行为规制的困境与出路  网络首发</td>\n",
       "      <td>谭袁</td>\n",
       "      <td>法治研究</td>\n",
       "      <td>2021-07-01 15:17</td>\n",
       "      <td>NaN</td>\n",
       "      <td>27.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>铁路调度集中系统调车作业时间智能预测方法研究  网络首发</td>\n",
       "      <td>韩浪; 王壮锋; 张春德</td>\n",
       "      <td>铁道标准设计</td>\n",
       "      <td>2021-07-01 15:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>11.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>医院财务智能化转型路径探析  网络首发</td>\n",
       "      <td>刘波; 曾绍颖; 张晓玮; 李琼</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>数据开放共享与个人隐私保护对策研究——层次数据与算法问责</td>\n",
       "      <td>窦悦</td>\n",
       "      <td>现代情报</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>全球主要生态退化区和研究热点区的空间分布与演变  网络首发</td>\n",
       "      <td>张云芝; 胡云锋; 韩月琪; 战胜</td>\n",
       "      <td>生态学报</td>\n",
       "      <td>2021-06-30 10:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>43.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例  网络首发</td>\n",
       "      <td>王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-30 09:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>43.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例</td>\n",
       "      <td>王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-30 09:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>地理综合研究方法的发展与思考  网络首发</td>\n",
       "      <td>闾国年;周成虎;林珲;陈旻;乐松山</td>\n",
       "      <td>科学通报</td>\n",
       "      <td>2021-06-30 09:12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>31.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>绿色理念下智慧零售创新发展路径</td>\n",
       "      <td>翟璇</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》</td>\n",
       "      <td>单浩耘</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>56.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>基于深度卷积生成对抗网络的缺失数据生成方法及其在剩余寿命预测中的应用  网络首发</td>\n",
       "      <td>张晟斐; 李天梅; 胡昌华; 杜党波; 司小胜</td>\n",
       "      <td>航空学报</td>\n",
       "      <td>2021-06-29 17:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>52.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>我国大数据审计研究综述——基于中文核心期刊文献研究  网络首发</td>\n",
       "      <td>王海洪; 吕登辉; 任美; 王婧; 王盈盈</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-29 17:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>170.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>我国大数据审计研究综述——基于中文核心期刊文献研究</td>\n",
       "      <td>王海洪; 吕登辉; 任美; 王婧; 王盈盈</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-29 17:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>智能化金融监管：模型框架、边缘约束和实践策略  网络首发</td>\n",
       "      <td>乔宇锋</td>\n",
       "      <td>南方金融</td>\n",
       "      <td>2021-06-29 17:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>“智能+”时代的现代文化产业体系：挑战与重塑</td>\n",
       "      <td>解学芳; 雷文宣</td>\n",
       "      <td>深圳大学学报(人文社会科学版)</td>\n",
       "      <td>2021-06-29 15:45</td>\n",
       "      <td>NaN</td>\n",
       "      <td>83.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>新时代发挥统计监督职能的思考</td>\n",
       "      <td>李金昌; 余卫</td>\n",
       "      <td>统计研究</td>\n",
       "      <td>2021-06-29 15:43</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>近20年长江经济带生态环境变化  网络首发</td>\n",
       "      <td>周权平;张澎彬;薛腾飞;姜月华;郭琳</td>\n",
       "      <td>中国地质</td>\n",
       "      <td>2021-06-29 14:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>科研大数据生态系统:构成要素及关联关系——以极地科研大数据为例  网络首发</td>\n",
       "      <td>丰佰恒; 佟泽华; 冯晓; 石江瀚; 孙晓彬</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-29 14:34</td>\n",
       "      <td>NaN</td>\n",
       "      <td>56.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>基于配网新形态下电费风险模型构建与应用  网络首发</td>\n",
       "      <td>戴璐平; 瞿青; 黄露; 潘晔</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2021-06-29 14:00</td>\n",
       "      <td>NaN</td>\n",
       "      <td>23.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>规模以下工业抽样设计研究</td>\n",
       "      <td>万舒晨</td>\n",
       "      <td>统计研究</td>\n",
       "      <td>2021-06-29 11:06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                           篇名  \\\n",
       "0            1                        智能化测绘的基本问题与发展方向  网络首发   \n",
       "1            2                 国土空间开发适宜性评价的理论、方法与技术应用  网络首发   \n",
       "2            3              基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发   \n",
       "3            4                      铁路盾构隧道智能建造技术现状与展望  网络首发   \n",
       "4            5         互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发   \n",
       "5            6                      森林生态站大数据快速存储与索引方法  网络首发   \n",
       "6            7                            互联网旅游统计体系初探  网络首发   \n",
       "7            8                 基于处方序列与处方序列对称分析的中药药物警戒  网络首发   \n",
       "8            9                   大数据金融：小微企业金融服务的创新与思考  网络首发   \n",
       "9           10  我国非银行支付适应性监管：基于鼓励金融创新、公平市场竞争与消费者保护的视角  网络首发   \n",
       "10          11                         三支决策在工业大数据中的应用  网络首发   \n",
       "11          12               大数据能力、服务链整合与政府智慧服务绩效关系研究  网络首发   \n",
       "12          13                  大数据时代中国共产党的形象建构：挑战与应对  网络首发   \n",
       "13          14                    电子信息领域硕士研究生工程伦理课程建设  网络首发   \n",
       "14          15                    中国经济发展规律与理论研究关键科学问题  网络首发   \n",
       "15          16               中国科技情报事业回顾与展望：基于情报学理论的视角  网络首发   \n",
       "16          17     基于地理大数据的省域休闲农业空间格局及其影响因素研究——以浙江省为例  网络首发   \n",
       "17          18                   基于靶向最大似然估计模型在高血压药物疗效评价中的应用   \n",
       "18          19          基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例  网络首发   \n",
       "19          20                基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例   \n",
       "20          21                             计算机技术在储能系统中的应用研究   \n",
       "21          22                           面向代码相似性检测的相似哈希改进方法   \n",
       "22          23              国际大洋钻探科学数据的现状、特征及其汇编的科学意义  网络首发   \n",
       "23          24                   金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "24          25                         大数据背景下档案信息服务体系构建方法探析   \n",
       "25          26                          数据赋能教育治理创新:内涵、机制与实践   \n",
       "26          27                      社交媒体大数据的教育应用研究:价值、路径与挑战   \n",
       "27          28                          大数据时代的科学实在论发展趋向及其特征   \n",
       "28          29                                健康医疗大数据公平问题研究   \n",
       "29          30                       智能财务人才培养与浙江大学的探索  网络首发   \n",
       "30          31                互联网平台滥用市场支配地位行为规制的困境与出路  网络首发   \n",
       "31          32                 铁路调度集中系统调车作业时间智能预测方法研究  网络首发   \n",
       "32          33                          医院财务智能化转型路径探析  网络首发   \n",
       "33          34                 数据开放共享与个人隐私保护对策研究——层次数据与算法问责   \n",
       "34          35                全球主要生态退化区和研究热点区的空间分布与演变  网络首发   \n",
       "35          36        基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例  网络首发   \n",
       "36          37              基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例   \n",
       "37          38                         地理综合研究方法的发展与思考  网络首发   \n",
       "38          39                              绿色理念下智慧零售创新发展路径   \n",
       "39          40           数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》   \n",
       "40          41     基于深度卷积生成对抗网络的缺失数据生成方法及其在剩余寿命预测中的应用  网络首发   \n",
       "41          42              我国大数据审计研究综述——基于中文核心期刊文献研究  网络首发   \n",
       "42          43                    我国大数据审计研究综述——基于中文核心期刊文献研究   \n",
       "43          44                 智能化金融监管：模型框架、边缘约束和实践策略  网络首发   \n",
       "44          45                       “智能+”时代的现代文化产业体系：挑战与重塑   \n",
       "45          46                               新时代发挥统计监督职能的思考   \n",
       "46          47                        近20年长江经济带生态环境变化  网络首发   \n",
       "47          48        科研大数据生态系统:构成要素及关联关系——以极地科研大数据为例  网络首发   \n",
       "48          49                    基于配网新形态下电费风险模型构建与应用  网络首发   \n",
       "49          50                                 规模以下工业抽样设计研究   \n",
       "\n",
       "                              作者               刊名              发表时间  被引  \\\n",
       "0   陈军; 刘万增; 武昊; Songnian Li; 闫利             测绘学报  2021-07-06 16:16 NaN   \n",
       "1                     刘小波;王玉宽;李明         地球信息科学学报  2021-07-06 15:54 NaN   \n",
       "2              李燕云;王永明;周奇;李亦学;王振        复旦学报(医学版)  2021-07-06 15:53 NaN   \n",
       "3            陈丹; 刘喆; 刘建友; 房倩; 海路        隧道建设(中英文)  2021-07-06 15:51 NaN   \n",
       "4                        郑翔; 山茂峰  北京交通大学学报(社会科学版)  2021-07-06 15:03 NaN   \n",
       "5         王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福           农业机械学报  2021-07-06 09:48 NaN   \n",
       "6                   刘冰洁; 李倩; 赵彦云            统计与决策  2021-07-05 17:36 NaN   \n",
       "7                   吕健; 王连心; 谢雁鸣           中国中药杂志  2021-07-05 15:51 NaN   \n",
       "8                            丁廉业             西南金融  2021-07-05 15:20 NaN   \n",
       "9                             陈游             西南金融  2021-07-05 15:20 NaN   \n",
       "10                       于洪; 杨雪梅    西北大学学报(自然科学版)  2021-07-05 14:19 NaN   \n",
       "11                       张艾荣; 吕娜              软科学  2021-07-05 13:38 NaN   \n",
       "12                      苏玉波; 刘婷婷  西安交通大学学报(社会科学版)  2021-07-05 13:37 NaN   \n",
       "13             周林娜; 常俊林; 代伟; 杨春雨             控制工程  2021-07-05 13:04 NaN   \n",
       "14       刘元春; 任之光; 陈彦斌; 杨列勋; 刘作仪           中国科学基金  2021-07-05 11:11 NaN   \n",
       "15                       王琳; 赖茂生          中国图书馆学报  2021-07-05 11:11 NaN   \n",
       "16             叶晗;吴博文;许红卫;干牧野;张晶           浙江农业学报  2021-07-05 11:09 NaN   \n",
       "17           潘凤鸣;赵红玉;吴新莹;冯一平;侯庆振         中华疾病控制杂志  2021-07-05 09:15 NaN   \n",
       "18               丁雄;蒋蔚;蒋静;胡跃华;武英         中华疾病控制杂志  2021-07-05 08:56 NaN   \n",
       "19               丁雄;蒋蔚;蒋静;胡跃华;武英         中华疾病控制杂志  2021-07-05 08:56 NaN   \n",
       "20                       李骏; 杨雅志          储能科学与技术        2021-07-05 NaN   \n",
       "21              李玫;高庆;马森;张世琨;胡文蕙             软件学报        2021-07-05 NaN   \n",
       "22           马鹏飞;刘志飞;拓守廷;蒋璟鑫;许艺炜           地球科学进展  2021-07-02 15:58 NaN   \n",
       "23                 陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN   \n",
       "24                   孔媛媛; 张舒; 王爱            档案与建设  2021-07-02 09:42 NaN   \n",
       "25                       张培; 夏海鹰           中国远程教育        2021-07-02 NaN   \n",
       "26                  李彤彤; 李坦; 郭栩宁           中国远程教育        2021-07-02 NaN   \n",
       "27                           刘伟伟          自然辩证法通讯        2021-07-02 NaN   \n",
       "28                      李晓洁; 丛亚丽          自然辩证法通讯        2021-07-02 NaN   \n",
       "29                        陈俊; 董望             财会月刊  2021-07-01 15:42 NaN   \n",
       "30                            谭袁             法治研究  2021-07-01 15:17 NaN   \n",
       "31                  韩浪; 王壮锋; 张春德           铁道标准设计  2021-07-01 15:09 NaN   \n",
       "32              刘波; 曾绍颖; 张晓玮; 李琼             财会月刊  2021-07-01 11:09 NaN   \n",
       "33                            窦悦             现代情报        2021-07-01 NaN   \n",
       "34             张云芝; 胡云锋; 韩月琪; 战胜             生态学报  2021-06-30 10:04 NaN   \n",
       "35         王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞             会计之友  2021-06-30 09:19 NaN   \n",
       "36         王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞             会计之友  2021-06-30 09:19 NaN   \n",
       "37             闾国年;周成虎;林珲;陈旻;乐松山             科学通报  2021-06-30 09:12 NaN   \n",
       "38                            翟璇           商业经济研究        2021-06-30 NaN   \n",
       "39                           单浩耘           商业经济研究        2021-06-30 NaN   \n",
       "40       张晟斐; 李天梅; 胡昌华; 杜党波; 司小胜             航空学报  2021-06-29 17:19 NaN   \n",
       "41         王海洪; 吕登辉; 任美; 王婧; 王盈盈             会计之友  2021-06-29 17:09 NaN   \n",
       "42         王海洪; 吕登辉; 任美; 王婧; 王盈盈             会计之友  2021-06-29 17:09 NaN   \n",
       "43                           乔宇锋             南方金融  2021-06-29 17:04 NaN   \n",
       "44                      解学芳; 雷文宣  深圳大学学报(人文社会科学版)  2021-06-29 15:45 NaN   \n",
       "45                       李金昌; 余卫             统计研究  2021-06-29 15:43 NaN   \n",
       "46            周权平;张澎彬;薛腾飞;姜月华;郭琳             中国地质  2021-06-29 14:54 NaN   \n",
       "47        丰佰恒; 佟泽华; 冯晓; 石江瀚; 孙晓彬          情报理论与实践  2021-06-29 14:34 NaN   \n",
       "48               戴璐平; 瞿青; 黄露; 潘晔             中国电力  2021-06-29 14:00 NaN   \n",
       "49                           万舒晨             统计研究  2021-06-29 11:06 NaN   \n",
       "\n",
       "       下载  操作  \n",
       "0     NaN  下载  \n",
       "1     NaN  下载  \n",
       "2     NaN  下载  \n",
       "3     NaN  下载  \n",
       "4     NaN  下载  \n",
       "5     NaN  下载  \n",
       "6     NaN  下载  \n",
       "7     NaN  下载  \n",
       "8     NaN  下载  \n",
       "9     NaN  下载  \n",
       "10    NaN  下载  \n",
       "11    NaN  下载  \n",
       "12    NaN  下载  \n",
       "13    NaN  下载  \n",
       "14    NaN  下载  \n",
       "15    NaN  下载  \n",
       "16    NaN  下载  \n",
       "17    NaN  下载  \n",
       "18    NaN  下载  \n",
       "19    NaN  下载  \n",
       "20    NaN  下载  \n",
       "21    NaN  下载  \n",
       "22    NaN  下载  \n",
       "23    NaN  下载  \n",
       "24    NaN  下载  \n",
       "25    NaN  下载  \n",
       "26    NaN  下载  \n",
       "27    NaN  下载  \n",
       "28    NaN  下载  \n",
       "29   53.0  下载  \n",
       "30   27.0  下载  \n",
       "31   11.0  下载  \n",
       "32   19.0  下载  \n",
       "33    5.0  下载  \n",
       "34   43.0  下载  \n",
       "35   43.0  下载  \n",
       "36    NaN  下载  \n",
       "37   31.0  下载  \n",
       "38   28.0  下载  \n",
       "39   56.0  下载  \n",
       "40   52.0  下载  \n",
       "41  170.0  下载  \n",
       "42    NaN  下载  \n",
       "43  119.0  下载  \n",
       "44   83.0  下载  \n",
       "45   33.0  下载  \n",
       "46   58.0  下载  \n",
       "47   56.0  下载  \n",
       "48   23.0  下载  \n",
       "49   28.0  下载  "
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Locate the search-result container and parse the table inside it into a DataFrame.\n",
    "# The generic find_element('id', ...) form is used instead of find_element_by_id,\n",
    "# which Selenium 4 deprecated and later removed; this form works on Selenium 3 and 4.\n",
    "element = driver.find_element('id', 'gridTable')\n",
    "页面_表格_html = element.get_attribute('innerHTML')\n",
    "# read_html returns a list of tables; the first one is displayed as the cell output.\n",
    "pd.read_html(页面_表格_html)[0]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 详细页链接"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [],
   "source": [
    "import re\n",
    "from lxml.html import fromstring"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Parse the rendered page and gather the link found in the second cell of every result row.\n",
    "html = driver.page_source\n",
    "root = fromstring(html)\n",
    "href = list(\n",
    "    root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')\n",
    ")\n",
    "\n",
    "def correct(href):\n",
    "    \"\"\"Rebuild the canonical CNKI detail-page URL from a result-list link.\n",
    "\n",
    "    The DbCode, dbname and filename query parameters are extracted from\n",
    "    ``href`` and placed on the kns.cnki.net detail endpoint.\n",
    "\n",
    "    Args:\n",
    "        href: Link string that carries the three query parameters.\n",
    "\n",
    "    Returns:\n",
    "        The detail-page URL as a string.\n",
    "\n",
    "    Raises:\n",
    "        IndexError: If one of the three parameters is missing. The exception\n",
    "            type matches what the previous list indexing raised.\n",
    "    \"\"\"\n",
    "    def _param(name):\n",
    "        # Anchor on the start, '?' or '&' so a key cannot match inside a longer key,\n",
    "        # and stop at '&', '#' or end of string so the last parameter is found too.\n",
    "        # Keys are matched case-insensitively (DbCode / dbcode / DBCODE).\n",
    "        found = re.search(rf'(?:^|[?&]){name}=([^&#]*)', href, flags=re.IGNORECASE)\n",
    "        if found is None:\n",
    "            raise IndexError(f'query parameter {name!r} not found in href: {href!r}')\n",
    "        return found.group(1)\n",
    "\n",
    "    DbCode = _param('DbCode')\n",
    "    dbname = _param('dbname')\n",
    "    filename = _param('filename')\n",
    "    return f\"https://kns.cnki.net/kcms/detail/detail.aspx?dbcode={DbCode}&dbname={dbname}&filename={filename}\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>智能化测绘的基本问题与发展方向  网络首发</td>\n",
       "      <td>陈军; 刘万增; 武昊; Songnian Li; 闫利</td>\n",
       "      <td>测绘学报</td>\n",
       "      <td>2021-07-06 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>国土空间开发适宜性评价的理论、方法与技术应用  网络首发</td>\n",
       "      <td>刘小波;王玉宽;李明</td>\n",
       "      <td>地球信息科学学报</td>\n",
       "      <td>2021-07-06 15:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发</td>\n",
       "      <td>李燕云;王永明;周奇;李亦学;王振</td>\n",
       "      <td>复旦学报(医学版)</td>\n",
       "      <td>2021-07-06 15:53</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>铁路盾构隧道智能建造技术现状与展望  网络首发</td>\n",
       "      <td>陈丹; 刘喆; 刘建友; 房倩; 海路</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-07-06 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发</td>\n",
       "      <td>郑翔; 山茂峰</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-06 15:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>互联网旅游统计体系初探  网络首发</td>\n",
       "      <td>刘冰洁; 李倩; 赵彦云</td>\n",
       "      <td>统计与决策</td>\n",
       "      <td>2021-07-05 17:36</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>基于处方序列与处方序列对称分析的中药药物警戒  网络首发</td>\n",
       "      <td>吕健; 王连心; 谢雁鸣</td>\n",
       "      <td>中国中药杂志</td>\n",
       "      <td>2021-07-05 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>大数据金融：小微企业金融服务的创新与思考  网络首发</td>\n",
       "      <td>丁廉业</td>\n",
       "      <td>西南金融</td>\n",
       "      <td>2021-07-05 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>我国非银行支付适应性监管：基于鼓励金融创新、公平市场竞争与消费者保护的视角  网络首发</td>\n",
       "      <td>陈游</td>\n",
       "      <td>西南金融</td>\n",
       "      <td>2021-07-05 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>三支决策在工业大数据中的应用  网络首发</td>\n",
       "      <td>于洪; 杨雪梅</td>\n",
       "      <td>西北大学学报(自然科学版)</td>\n",
       "      <td>2021-07-05 14:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>大数据能力、服务链整合与政府智慧服务绩效关系研究  网络首发</td>\n",
       "      <td>张艾荣; 吕娜</td>\n",
       "      <td>软科学</td>\n",
       "      <td>2021-07-05 13:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据时代中国共产党的形象建构：挑战与应对  网络首发</td>\n",
       "      <td>苏玉波; 刘婷婷</td>\n",
       "      <td>西安交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-05 13:37</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>电子信息领域硕士研究生工程伦理课程建设  网络首发</td>\n",
       "      <td>周林娜; 常俊林; 代伟; 杨春雨</td>\n",
       "      <td>控制工程</td>\n",
       "      <td>2021-07-05 13:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>中国经济发展规律与理论研究关键科学问题  网络首发</td>\n",
       "      <td>刘元春; 任之光; 陈彦斌; 杨列勋; 刘作仪</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-05 11:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>中国科技情报事业回顾与展望：基于情报学理论的视角  网络首发</td>\n",
       "      <td>王琳; 赖茂生</td>\n",
       "      <td>中国图书馆学报</td>\n",
       "      <td>2021-07-05 11:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>基于地理大数据的省域休闲农业空间格局及其影响因素研究——以浙江省为例  网络首发</td>\n",
       "      <td>叶晗;吴博文;许红卫;干牧野;张晶</td>\n",
       "      <td>浙江农业学报</td>\n",
       "      <td>2021-07-05 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>基于靶向最大似然估计模型在高血压药物疗效评价中的应用</td>\n",
       "      <td>潘凤鸣;赵红玉;吴新莹;冯一平;侯庆振</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 09:15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例  网络首发</td>\n",
       "      <td>丁雄;蒋蔚;蒋静;胡跃华;武英</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 08:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例</td>\n",
       "      <td>丁雄;蒋蔚;蒋静;胡跃华;武英</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 08:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>计算机技术在储能系统中的应用研究</td>\n",
       "      <td>李骏; 杨雅志</td>\n",
       "      <td>储能科学与技术</td>\n",
       "      <td>2021-07-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>面向代码相似性检测的相似哈希改进方法</td>\n",
       "      <td>李玫;高庆;马森;张世琨;胡文蕙</td>\n",
       "      <td>软件学报</td>\n",
       "      <td>2021-07-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>国际大洋钻探科学数据的现状、特征及其汇编的科学意义  网络首发</td>\n",
       "      <td>马鹏飞;刘志飞;拓守廷;蒋璟鑫;许艺炜</td>\n",
       "      <td>地球科学进展</td>\n",
       "      <td>2021-07-02 15:58</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据背景下档案信息服务体系构建方法探析</td>\n",
       "      <td>孔媛媛; 张舒; 王爱</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 09:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>数据赋能教育治理创新:内涵、机制与实践</td>\n",
       "      <td>张培; 夏海鹰</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>社交媒体大数据的教育应用研究:价值、路径与挑战</td>\n",
       "      <td>李彤彤; 李坦; 郭栩宁</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>大数据时代的科学实在论发展趋向及其特征</td>\n",
       "      <td>刘伟伟</td>\n",
       "      <td>自然辩证法通讯</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>健康医疗大数据公平问题研究</td>\n",
       "      <td>李晓洁; 丛亚丽</td>\n",
       "      <td>自然辩证法通讯</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>智能财务人才培养与浙江大学的探索  网络首发</td>\n",
       "      <td>陈俊; 董望</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 15:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>互联网平台滥用市场支配地位行为规制的困境与出路  网络首发</td>\n",
       "      <td>谭袁</td>\n",
       "      <td>法治研究</td>\n",
       "      <td>2021-07-01 15:17</td>\n",
       "      <td>NaN</td>\n",
       "      <td>27.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>铁路调度集中系统调车作业时间智能预测方法研究  网络首发</td>\n",
       "      <td>韩浪; 王壮锋; 张春德</td>\n",
       "      <td>铁道标准设计</td>\n",
       "      <td>2021-07-01 15:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>11.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>医院财务智能化转型路径探析  网络首发</td>\n",
       "      <td>刘波; 曾绍颖; 张晓玮; 李琼</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>数据开放共享与个人隐私保护对策研究——层次数据与算法问责</td>\n",
       "      <td>窦悦</td>\n",
       "      <td>现代情报</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>全球主要生态退化区和研究热点区的空间分布与演变  网络首发</td>\n",
       "      <td>张云芝; 胡云锋; 韩月琪; 战胜</td>\n",
       "      <td>生态学报</td>\n",
       "      <td>2021-06-30 10:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>43.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例  网络首发</td>\n",
       "      <td>王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-30 09:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>43.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例</td>\n",
       "      <td>王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-30 09:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>地理综合研究方法的发展与思考  网络首发</td>\n",
       "      <td>闾国年;周成虎;林珲;陈旻;乐松山</td>\n",
       "      <td>科学通报</td>\n",
       "      <td>2021-06-30 09:12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>31.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>绿色理念下智慧零售创新发展路径</td>\n",
       "      <td>翟璇</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》</td>\n",
       "      <td>单浩耘</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>56.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>基于深度卷积生成对抗网络的缺失数据生成方法及其在剩余寿命预测中的应用  网络首发</td>\n",
       "      <td>张晟斐; 李天梅; 胡昌华; 杜党波; 司小胜</td>\n",
       "      <td>航空学报</td>\n",
       "      <td>2021-06-29 17:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>52.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>我国大数据审计研究综述——基于中文核心期刊文献研究  网络首发</td>\n",
       "      <td>王海洪; 吕登辉; 任美; 王婧; 王盈盈</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-29 17:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>170.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>我国大数据审计研究综述——基于中文核心期刊文献研究</td>\n",
       "      <td>王海洪; 吕登辉; 任美; 王婧; 王盈盈</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-29 17:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>智能化金融监管：模型框架、边缘约束和实践策略  网络首发</td>\n",
       "      <td>乔宇锋</td>\n",
       "      <td>南方金融</td>\n",
       "      <td>2021-06-29 17:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>“智能+”时代的现代文化产业体系：挑战与重塑</td>\n",
       "      <td>解学芳; 雷文宣</td>\n",
       "      <td>深圳大学学报(人文社会科学版)</td>\n",
       "      <td>2021-06-29 15:45</td>\n",
       "      <td>NaN</td>\n",
       "      <td>83.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>新时代发挥统计监督职能的思考</td>\n",
       "      <td>李金昌; 余卫</td>\n",
       "      <td>统计研究</td>\n",
       "      <td>2021-06-29 15:43</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>近20年长江经济带生态环境变化  网络首发</td>\n",
       "      <td>周权平;张澎彬;薛腾飞;姜月华;郭琳</td>\n",
       "      <td>中国地质</td>\n",
       "      <td>2021-06-29 14:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>科研大数据生态系统:构成要素及关联关系——以极地科研大数据为例  网络首发</td>\n",
       "      <td>丰佰恒; 佟泽华; 冯晓; 石江瀚; 孙晓彬</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-29 14:34</td>\n",
       "      <td>NaN</td>\n",
       "      <td>56.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>基于配网新形态下电费风险模型构建与应用  网络首发</td>\n",
       "      <td>戴璐平; 瞿青; 黄露; 潘晔</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2021-06-29 14:00</td>\n",
       "      <td>NaN</td>\n",
       "      <td>23.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>规模以下工业抽样设计研究</td>\n",
       "      <td>万舒晨</td>\n",
       "      <td>统计研究</td>\n",
       "      <td>2021-06-29 11:06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                           篇名  \\\n",
       "0            1                        智能化测绘的基本问题与发展方向  网络首发   \n",
       "1            2                 国土空间开发适宜性评价的理论、方法与技术应用  网络首发   \n",
       "2            3              基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发   \n",
       "3            4                      铁路盾构隧道智能建造技术现状与展望  网络首发   \n",
       "4            5         互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发   \n",
       "5            6                      森林生态站大数据快速存储与索引方法  网络首发   \n",
       "6            7                            互联网旅游统计体系初探  网络首发   \n",
       "7            8                 基于处方序列与处方序列对称分析的中药药物警戒  网络首发   \n",
       "8            9                   大数据金融：小微企业金融服务的创新与思考  网络首发   \n",
       "9           10  我国非银行支付适应性监管：基于鼓励金融创新、公平市场竞争与消费者保护的视角  网络首发   \n",
       "10          11                         三支决策在工业大数据中的应用  网络首发   \n",
       "11          12               大数据能力、服务链整合与政府智慧服务绩效关系研究  网络首发   \n",
       "12          13                  大数据时代中国共产党的形象建构：挑战与应对  网络首发   \n",
       "13          14                    电子信息领域硕士研究生工程伦理课程建设  网络首发   \n",
       "14          15                    中国经济发展规律与理论研究关键科学问题  网络首发   \n",
       "15          16               中国科技情报事业回顾与展望：基于情报学理论的视角  网络首发   \n",
       "16          17     基于地理大数据的省域休闲农业空间格局及其影响因素研究——以浙江省为例  网络首发   \n",
       "17          18                   基于靶向最大似然估计模型在高血压药物疗效评价中的应用   \n",
       "18          19          基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例  网络首发   \n",
       "19          20                基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例   \n",
       "20          21                             计算机技术在储能系统中的应用研究   \n",
       "21          22                           面向代码相似性检测的相似哈希改进方法   \n",
       "22          23              国际大洋钻探科学数据的现状、特征及其汇编的科学意义  网络首发   \n",
       "23          24                   金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "24          25                         大数据背景下档案信息服务体系构建方法探析   \n",
       "25          26                          数据赋能教育治理创新:内涵、机制与实践   \n",
       "26          27                      社交媒体大数据的教育应用研究:价值、路径与挑战   \n",
       "27          28                          大数据时代的科学实在论发展趋向及其特征   \n",
       "28          29                                健康医疗大数据公平问题研究   \n",
       "29          30                       智能财务人才培养与浙江大学的探索  网络首发   \n",
       "30          31                互联网平台滥用市场支配地位行为规制的困境与出路  网络首发   \n",
       "31          32                 铁路调度集中系统调车作业时间智能预测方法研究  网络首发   \n",
       "32          33                          医院财务智能化转型路径探析  网络首发   \n",
       "33          34                 数据开放共享与个人隐私保护对策研究——层次数据与算法问责   \n",
       "34          35                全球主要生态退化区和研究热点区的空间分布与演变  网络首发   \n",
       "35          36        基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例  网络首发   \n",
       "36          37              基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例   \n",
       "37          38                         地理综合研究方法的发展与思考  网络首发   \n",
       "38          39                              绿色理念下智慧零售创新发展路径   \n",
       "39          40           数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》   \n",
       "40          41     基于深度卷积生成对抗网络的缺失数据生成方法及其在剩余寿命预测中的应用  网络首发   \n",
       "41          42              我国大数据审计研究综述——基于中文核心期刊文献研究  网络首发   \n",
       "42          43                    我国大数据审计研究综述——基于中文核心期刊文献研究   \n",
       "43          44                 智能化金融监管：模型框架、边缘约束和实践策略  网络首发   \n",
       "44          45                       “智能+”时代的现代文化产业体系：挑战与重塑   \n",
       "45          46                               新时代发挥统计监督职能的思考   \n",
       "46          47                        近20年长江经济带生态环境变化  网络首发   \n",
       "47          48        科研大数据生态系统:构成要素及关联关系——以极地科研大数据为例  网络首发   \n",
       "48          49                    基于配网新形态下电费风险模型构建与应用  网络首发   \n",
       "49          50                                 规模以下工业抽样设计研究   \n",
       "\n",
       "                              作者               刊名              发表时间  被引  \\\n",
       "0   陈军; 刘万增; 武昊; Songnian Li; 闫利             测绘学报  2021-07-06 16:16 NaN   \n",
       "1                     刘小波;王玉宽;李明         地球信息科学学报  2021-07-06 15:54 NaN   \n",
       "2              李燕云;王永明;周奇;李亦学;王振        复旦学报(医学版)  2021-07-06 15:53 NaN   \n",
       "3            陈丹; 刘喆; 刘建友; 房倩; 海路        隧道建设(中英文)  2021-07-06 15:51 NaN   \n",
       "4                        郑翔; 山茂峰  北京交通大学学报(社会科学版)  2021-07-06 15:03 NaN   \n",
       "5         王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福           农业机械学报  2021-07-06 09:48 NaN   \n",
       "6                   刘冰洁; 李倩; 赵彦云            统计与决策  2021-07-05 17:36 NaN   \n",
       "7                   吕健; 王连心; 谢雁鸣           中国中药杂志  2021-07-05 15:51 NaN   \n",
       "8                            丁廉业             西南金融  2021-07-05 15:20 NaN   \n",
       "9                             陈游             西南金融  2021-07-05 15:20 NaN   \n",
       "10                       于洪; 杨雪梅    西北大学学报(自然科学版)  2021-07-05 14:19 NaN   \n",
       "11                       张艾荣; 吕娜              软科学  2021-07-05 13:38 NaN   \n",
       "12                      苏玉波; 刘婷婷  西安交通大学学报(社会科学版)  2021-07-05 13:37 NaN   \n",
       "13             周林娜; 常俊林; 代伟; 杨春雨             控制工程  2021-07-05 13:04 NaN   \n",
       "14       刘元春; 任之光; 陈彦斌; 杨列勋; 刘作仪           中国科学基金  2021-07-05 11:11 NaN   \n",
       "15                       王琳; 赖茂生          中国图书馆学报  2021-07-05 11:11 NaN   \n",
       "16             叶晗;吴博文;许红卫;干牧野;张晶           浙江农业学报  2021-07-05 11:09 NaN   \n",
       "17           潘凤鸣;赵红玉;吴新莹;冯一平;侯庆振         中华疾病控制杂志  2021-07-05 09:15 NaN   \n",
       "18               丁雄;蒋蔚;蒋静;胡跃华;武英         中华疾病控制杂志  2021-07-05 08:56 NaN   \n",
       "19               丁雄;蒋蔚;蒋静;胡跃华;武英         中华疾病控制杂志  2021-07-05 08:56 NaN   \n",
       "20                       李骏; 杨雅志          储能科学与技术        2021-07-05 NaN   \n",
       "21              李玫;高庆;马森;张世琨;胡文蕙             软件学报        2021-07-05 NaN   \n",
       "22           马鹏飞;刘志飞;拓守廷;蒋璟鑫;许艺炜           地球科学进展  2021-07-02 15:58 NaN   \n",
       "23                 陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN   \n",
       "24                   孔媛媛; 张舒; 王爱            档案与建设  2021-07-02 09:42 NaN   \n",
       "25                       张培; 夏海鹰           中国远程教育        2021-07-02 NaN   \n",
       "26                  李彤彤; 李坦; 郭栩宁           中国远程教育        2021-07-02 NaN   \n",
       "27                           刘伟伟          自然辩证法通讯        2021-07-02 NaN   \n",
       "28                      李晓洁; 丛亚丽          自然辩证法通讯        2021-07-02 NaN   \n",
       "29                        陈俊; 董望             财会月刊  2021-07-01 15:42 NaN   \n",
       "30                            谭袁             法治研究  2021-07-01 15:17 NaN   \n",
       "31                  韩浪; 王壮锋; 张春德           铁道标准设计  2021-07-01 15:09 NaN   \n",
       "32              刘波; 曾绍颖; 张晓玮; 李琼             财会月刊  2021-07-01 11:09 NaN   \n",
       "33                            窦悦             现代情报        2021-07-01 NaN   \n",
       "34             张云芝; 胡云锋; 韩月琪; 战胜             生态学报  2021-06-30 10:04 NaN   \n",
       "35         王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞             会计之友  2021-06-30 09:19 NaN   \n",
       "36         王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞             会计之友  2021-06-30 09:19 NaN   \n",
       "37             闾国年;周成虎;林珲;陈旻;乐松山             科学通报  2021-06-30 09:12 NaN   \n",
       "38                            翟璇           商业经济研究        2021-06-30 NaN   \n",
       "39                           单浩耘           商业经济研究        2021-06-30 NaN   \n",
       "40       张晟斐; 李天梅; 胡昌华; 杜党波; 司小胜             航空学报  2021-06-29 17:19 NaN   \n",
       "41         王海洪; 吕登辉; 任美; 王婧; 王盈盈             会计之友  2021-06-29 17:09 NaN   \n",
       "42         王海洪; 吕登辉; 任美; 王婧; 王盈盈             会计之友  2021-06-29 17:09 NaN   \n",
       "43                           乔宇锋             南方金融  2021-06-29 17:04 NaN   \n",
       "44                      解学芳; 雷文宣  深圳大学学报(人文社会科学版)  2021-06-29 15:45 NaN   \n",
       "45                       李金昌; 余卫             统计研究  2021-06-29 15:43 NaN   \n",
       "46            周权平;张澎彬;薛腾飞;姜月华;郭琳             中国地质  2021-06-29 14:54 NaN   \n",
       "47        丰佰恒; 佟泽华; 冯晓; 石江瀚; 孙晓彬          情报理论与实践  2021-06-29 14:34 NaN   \n",
       "48               戴璐平; 瞿青; 黄露; 潘晔             中国电力  2021-06-29 14:00 NaN   \n",
       "49                           万舒晨             统计研究  2021-06-29 11:06 NaN   \n",
       "\n",
       "       下载  操作                                              详细页链接  \n",
       "0     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "1     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "2     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "3     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "4     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "5     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "6     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "7     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "8     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "9     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "10    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "11    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "12    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "13    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "14    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "15    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "16    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "17    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "18    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "19    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "20    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "21    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "22    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "23    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "24    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "25    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "26    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "27    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "28    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "29   53.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "30   27.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "31   11.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "32   19.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "33    5.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "34   43.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "35   43.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "36    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "37   31.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "38   28.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "39   56.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "40   52.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "41  170.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "42    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "43  119.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "44   83.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "45   33.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "46   58.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "47   56.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "48   23.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "49   28.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...  "
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Run every scraped href through correct() (defined elsewhere in this notebook)\n",
    "# and collect the results as the detail-page link column.\n",
    "links=[]\n",
    "\n",
    "for link in href:\n",
    "    link=correct(link)\n",
    "    links.append(link)\n",
    "\n",
    "# Build the link column and parse the result table ONCE, after the loop.\n",
    "# Doing this per iteration re-parsed the same HTML for every link and left\n",
    "# df_首页 unassigned (or stale from a previous run) whenever href was empty.\n",
    "df_links=pd.DataFrame({'详细页链接':links})\n",
    "df_首页=pd.concat([pd.read_html(页面_表格_html)[0],df_links],axis=1)\n",
    "\n",
    "df_首页"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# PDF链接"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [],
   "source": [
    "from requests_html import HTMLSession\n",
    "import urllib.parse"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['/kcms/download.aspx?filename=rYGVSFGZQhUTshVdVl2MiJXWLVVVZlVZ6dTdQhFNSdzMFRnS1p0TsxmNQN2NyIDZCJ3RWx0bQJlbWZ1YY1kbxZkSrFDVvRzSZF0KFRWRzQjQ3NWb4hXRPdFTwZjQycGVZpWa3M0Tv9iRL9yLUJ0QpVWRthzRutmR&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=P9kQZt0d3JVTnBnUolDej9iTZBleKV0ZO9GMZpWQ5pmRxQjbv5WR0QVb1EzTH9kSGRVVK9mURVXeSlWaPtCOlFkZ5pWdVtCTxgVW0NTOnZzQkNDcDVnaYp0NIZmdmBlNLpmWmlXQJ1Ec3o3TCRndhRTQXRkaCl0Z&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=xcDbhFHcLpHaLNWeadGU0cXMvdDT1lGM0IDbw9kb2BTSjJ0LDpHOVdkT61mVDpFbOBFZTt0QLZWUPZHcnpkWrMlYyMmMmp0dr5mYvlzcSNEaRVXMv9iUsJWS28mS2gDWhZVS2J2atJXYmVVTGxkM2gjTXRDcEp2L&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=a50YwI3UxR0VLBXSjRkclBzMMFVWiNGbVFzT0NmS1dHSPlDRnlXMykTUXRkQ1dTaZp2YOVndsFndpZ2cuZmRtt0SVBjVlB3QN9EUjFmMWRXeFh1USh0KjNzNORVWwk0bw92TxtSaCdDZLtUYlNkYrR2dyUEdJtmb&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=uNHTpRDd2cUcWplaOZ1R3Ynd502LzRWa3U0QrRDVppXczc2aLVVR2J2NvR1d2sUNFZzUpFlZtJ2TlNneo9SUwp3N4VzdLBTamRzKKZXOPlneuZHdwsmdkBjcMlnQURjSHdzMDd0QaRWYp5GOXBHNIB3Q2c1bRF2T&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=udEa1ZET0wkNSBjTxx2YJtWUkBleDtWdqlXdBlmb4M1dOJmeHZmZ2VDTQh3ctVWNXpEO4IUWO1GdHN2QHNDRVZWOvR2aWRTT3YGO4c1aqlTaLZ3LRp0T1YGMsJlR0dUb080RqZjUJZ2Mw8WVKBVYtJ0T5AjM1kGV&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=VFDMyk0Z0MHRNlnbMN3T4lTeTVHOmlDNTtiRPFGRBlkW1tSW4hHcBZ3dl9iQPp0aJp1LJhkQwhmcYFWTpZUYRFTT4NmN1F2bLN1VkVTSslEarcVS0g3KHdWd3pHN2Q2L0RXbYlHe4g1TyV3Z4czd2F1Z65WSHhFU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=vJXb6Vzd0MnaT9UN0Y1b3EHRkJDR2xEZSFWZRpUOih3ZOljUxcGSStyLv42aoNnYiZzVVpXdJJEWytEUHJmRwFkZBhFNLZDZKVTdLpWSsV2M4F0NQ90aQBXe1J2LNFDTmlFNWhUQlNkaxpnbQJ0TSV0K1MVdJpmN&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=CZlMWdlRzBnZx1maCl1YHd3QrZXMHVzNYd2RMdlWVNTQwVzZ1BXYMBnYYh0b6JFS5N3YrZFWKxGcuh1V2pmbwlje0pkQBxWbWRTdFdlbItiWkxkUrR2MHRETpVjQsVkZOVzYPB3YPpUYqdFUIFTM5J2LVl0MztWU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=YpFbktEWil0UMh1SRFkYN9kesRTSipUUFhWUKRDMmFEW0cGRuZkSYVGbygjN582RsBXMCFHSM9kQrt2Y2N1Sll1bRpGRll3QqVGbo9EU0JENuV0KNVka5hzLwoGTkpGUCNTO6ZkaEZTRF5mboRjU1EDUOlzNFJkR&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=htGe28kYx9iaro1QTNHTOR3dqRUczQVO5U0QHVzQsdTdF52VNRWUQ5mMnVkR3UXa2FmcldHbutUeJhWbwVnT6RDW0ZFcNNUMotWTohkTnljZzJmQwUFayBXMxFDR6tGOyo3U6RGVDt0LCN1YvYmYixEeztUdKZDO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=iZzYWR0bE52ZER0Qzkjb1YEWuR1LjR0Zm9yUVFUavhVOoFDbCRGVHl3UrtmTrcFb0o0SIJ1aqJUdwJ2RM5EcwEkQmx2cwIVRXdGdKNjQ2oXYFl3SBd3dBRjVQJkV2EHTyJ1bqFkVWh1NEdUa6lXcTtyUXhnRSdnR&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mNUMuh1ZvokQvkGZzRHdI5UZ3FTRx1URUBHTrQ0NMdDbCZVZIFESXdTRnVWThR0aYFGW20WVsZWRtdXTId2avZHe4RTeJh2LOdEe2JFa3NmMY10Kzs0dsNTYSp0R0lmWGd0ZMJje3UVYzN0ZVl2YrwkY5kkSjx0K&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=Nt2VRd3KohTa3FVboVTNyJVY0R3cFNDMENnVpJDS4NFNnRTdZlme1NjcOZkYwhVW44UOhhlTEh3aPpFUxNTckZGdu12duZEV5YzSvoXbvs0RuJmMoZmYLVHNSJTZpZkV3YXZP1EWzVmTrlXTYtkZWdGNhdjUil0M&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=0F2c4QncLZ3aNZlSH5mTzljcZR3dEVzdMN3byknMxgGSMZ1Z1VmTQdmdrMDWvN3KMV2YKRWcnRXaldlWj9yMFNEZnVlayNUQLVlTyI2VU1UOWlHTtdkTFllZ0gmSRJTYFlGMJtiUQpWZ3N2QxwmQuJlYaplezIFe&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=5NUczh2SGd1V1UFV5JUcZZGMqtmTjRVV4UnaTRHb5ckch9WSRRXVIplM2Y3d1onUSpWMG9kaHxkT5d0Y1NTUsN1VzFjepBTZuN1VHJ0VyQlUlJGc4dTYvBjdwcXNT5UMrtEMXZWQqF3UNlGUrIjMMdDRThVRlFGW&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=4JzYLdVU3cDV4JzTEhWNaR0d3V1b0ITekF1SUljdHljaYpWWKZEZvMkYvk3NuZkUqNDNYJXTJB3Z2RlaBpme4tkMRREZvNHbihGai9idSp3UaNmcVhUQB9SNpJGbudFd51GSylmYKRWN1xkYSR1NSt2d1MjMvEHS&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=TezNVO2wmM4kGM112KPZVd1UkSSNUdOx0LMZ2UqR1Sv50RxA1MKZXMh92SrpFeptkcv5EeKFWcy9Gc=0TQvBXdKZzTRl2bYFFbHZkMCJlUvVlNvFTOvNjdTJUZ2wGZm9CO0BlWppkS4hHdh1WWmd2NWZ1NYh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=RhXRil1Q4gGRVBjb38SOtFEZpNmMXpmVqtCOXZFTB50QBpXOwZmcOJzbHRkb19yMwEzdnRVYkZ1bRxmeXBFbxgWb0s2dvsmNiZ0S3RXaDp1L4MDSKlFdldFR0hlb4sEexdzMPZFcOZVMwFHeP1kRjlDOjFVZQJ0L&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mWyBHO08UbGlURGRFVXd0MvJnQ3FkdmhTdoJ3UzMXesxUexJURh10LlVjU2UFNBJkSz9GTmpHSNl3R=0TVEB1bVd2VPJXOxYnUMJXZXt2dh9yQEd1L2sWazljcNlTVFp1R4kkcZhUYsRDOQdDWr1WWCh2UhJ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=HRvJUVLR2TBVVc0NUZYpEWIhFZZVDbY9EatJTUNpHdxhkUpZ3dJpFUrwmQyF1VIFXTrZ3ZIVnRkZXU=0DN1UkUJd0ciVTRkZXazNza3QjdhJUQzcETmpGSQFWbslWU2ETe6tkd2glZkJVeklWaulEardTWHV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=GbDpEWRhEWWhjSK50chlHMyJTeXNkRWRkQSNERsVDRSBzRhZnM4Q0LnR2bx8iSLdTckllUChFUal0V=0DNzoGSX1EWvVmRrFlN6J3LINzKhxGW5glQ2Q1ZwUXeIVkWzomZIJFS24mNjVDeyADeSZ1T3MDMxt&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=utGclRHbZNle2czNiNER5BXZDVHOBx0VRZkejJVTsF1Yv8UZjlXUUBFajZFeSxUbGRzb3UWdkRlTwZ0ZDNHb4YHdwInM5d3Rwt0VDljeyxEOnB1UwgjS3tWZqpkYV9mYjRmdltmc0ImZUhUQKRDS1kHZZJ3T6JzL&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=hVmUxUEb0B3dZhHRXZ2YHB3LvFkbkB1VU9EO5hmeLd0VsxkcpFXZnd3N5gHUlN0LCZDZqJkZlVUWtFWbERkRzZXYl9ERRlzblVndSZkQhVETRp0N5F1TJ9kZkRnd5wmNwplbaljexFkR0JmQ2R2ZydDcm9iVaRzK&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ES1tGcwd2YwMUUQVDWkpnevYDbzxWTQNTdnRkSlljWGl0N5s0cFd2V3BzQEF2djN2SrZVUZhmcp5Gd=0TWIlkal10TTxWZ5IlZoZWNnlFd5MDNL50R21WUXdDOvoHV2k1KQd1RKlTVKZTcFhUZ1omYJZzQtl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1QGZkZrplQWFFbZNUTrknbTVkRZBHZ0YEbiJVcsN0YNJEW2EWSLV2LFllarZTNxkmbhdkS5J0VDh1d=0DMIVUO10WWEJGN1okbyVFbwQmdshTS3EWWvkFahdWd4wGeVlGOXt2V1knbMdGWOhHTP9CS5p1cxc&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FRUxmVDlHdll0Z0F2YnZDaRdGbn5WRQlFMw42ZVlVSZp1bwNkbPR2NNNFN2YVcHFHTiJWbCR2b6tGR=0zcvgEMvRFUwpGb1k2bkBjbmR0TyVWTrskNLZDT2kTT500NDNTOwUjN00EMzYkeC9yUwNVTqJzTBJ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=zQ6FlNYhFc0Njc0o2ZYVVUoVmVKNWVrYnU3FVbotmSsVnd1YDV1UkRwVjR38WdnhnZUVVZidXViV1R=0zYa1UYCN1UsFzaOp0Z2czQjFVTyQ0aORUdsR1U3o1crhTZL50QtBVTzAHaChWQDpXa3JVSOVnd1A&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=zQ6FlNYhFc0Njc0o2ZYVVUoVmVKNWVrYnU3FVbotmSsVnd1YDV1UkRwVjR38WdnhnZUVVZidXViV1R=0zYZpUYCN1UsFzaOp0Z2czQjFVTyQ0aORUdsR1U3o1crhTZL50QtBVTzAHaChWQDpXa3JVSOVnd1A&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=6pHW5BVNUFXT41GOLJUd3dlYC9GdwE2TJtWS3hzQsh0KnBDaBp3K1ZjZ1IDMphWOpxEU0BHUjpVbYhmTNd2SyVza5sUNvFHNmF3Y0s0SmlTV0gzQGd2cL12QYdzd1UEOr42LiZzUJB3MmBXcvV0LPFGdxYGSTdme&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=M5kaI9kdqVTVyp1VwsmYXdmN3gGSMtCTpx2SUlUNtVDb5xWVVZDaKRHMqpkVPZ3SVd3dMd3c3Z1YvV2VqRXR4EmZwBFS3VWeJZXS1NES3Z1KlNmNkxGOwgDNZN3UhRjNxxkSqF0Q2onYnZUc1tiaa9SW5MlY4RDO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=X5UOB9UdoZVOBpXNkNWR142VZZTWENlYOFGbLNTaQNUUSp0bCNzdtFEO2kDelRGdVZ3VwM0TZFVYFN2Za1kU34GTwgWYXpmTaZEVzF0Q2Ene5o2ROZWQupXaRF1d612MzhzaLdXQUJFSUZGR5MDTyZTVRF3d2MGd&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=pZmbON3dmRGNWhkao1ENoV2NV9SQvt2Z4cjTolXYrBTayg2ZIdnR4gXaxAjW2B3QGp1ROhVehJEdCdnb6J0SYV2VjFXN3Q2ZZpEToZ3YXR0dhNUWEJWa6ZUZ0lzQjtSNyUkdzFmM3IXRysSOwg0bzA3QTNUVVhnQ&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=zKvsCVONmYEZndjtUUCVkU3g2SptmWUpkZphlakpGdOFWajtWd0RnR1RUW0kzZrp3S4ElcCVVWkpVc=0zYNtEaoF1UmJVONJGNS9GOudFOpZkZDN3Kl9yRxATQx5kUmVTQHhzQM9mdvFUQvp3NZVWZw0WR5Q&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=EBHTEJGN0lXWGljbhFlUaJnYmJ3NFlFT2Uje4smYpVFeRdUaBNnRVh3RwJXeulkRSN3cJx2Y1hncaVHe0IHWQFjdxMnVolDOkJEZaZ1aPB1QRZzLDpWWqZDOUlEeqx0RBp3RKR3cJtkdRZ1Q3BXd2BTaz4ETGRVO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FFHN5l0MRtkNSpmc28iUOV0L5UVbXFTV1IUbOFzSvMWWyJGNTZFZodWVVFmew9yY5MHOwgkT3F2QWdER0lUb2InSy5EcSJVUVRWdWFWTQhTTapFbwMFMoJFaXp1MU92aWJDVNVlV5Q3Y3Yle3hmV3ZWWQhWT5ZFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=Wa55kcrs2cCFzVQpme1M0M1VTUDRHZMh3dKZXRGd0Tzg0TXVmaNp2Ms9yUHljR6ZnNDNnRXRHawJ3R=0zczNkSHFnQWdFMslWO5hkSjljTJNTQIhDbGRDSzo1Y2wUSk9icjd1RhlVeMZTaz4EaNpkayNVMjp&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=MlHO0UWNHV0bYVlVrcXO0lnY6lmaqp1NoBXZaJ1NCNTV5UXNmFGczh1TLVlR3kleVRTYl5UcZdletVkT6F3YhJUWPZTarhEO4Fjc3hjehRWVjFFViZ3UodTYTZUNFJ3VZl1Q5sCVWVGWBZ0SmtEcL1kd2l2dmZES&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=3N4okQ2MkRwxGcwoHRNpGdkZEZ5FXc0pXdDhHdwMWYQt0N2sieVVjbDh1coBFcDFXWTlGVah0SpFFV=0zd5NUTxFDeD1mVVpHTYR0ZvsSNZl2MPREbpFDNypGV0d3TL5Ue0MzaS9UYwYFMvZ3Mxl3K1MEUiB&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=3cyF2RwoHVDBTNZJlRwxWcGZmU4cDbwpEMY9UWaxUTr8keW9mUk5GUSxkWxoHNlNEZyQFTzNFeDJEW=0zZZRDcCtiVuxWUhp0bH5meR12RtZ2K1tWbOdGWYZjdwBXbKdmSkNWanpFd140RXVVZ0c1MMhjdOB&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=iF1LN92TvsWMLlFOjl2bVhFVuN3U1FVcYJHSHp0RrdkVkFHUI9SZ5MmcM1UdQhXTiVVNxh3d0RUS69EZhR0YVljTGZHcDlkTV9EVyYXZU5kWxEGcGZHWthkUVZmQaJEMJNlQoFWZ6dXUPJDMqZUTMljRrQHaK9We&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=6dEa5dDN1sCZkl0TstEdHZ0dyg0Q4IHM6N3dkt0Rp9mMGZFMvNHb3oUc5M1MLd0KGBVdJRUYXp3RYxkbrE0a5BnS0xETphFWrlTe3dHOxF0cVJHM0J2TUREaJV2RVJzcxR0NTh2TwIVR5JETZlzY6FUURBlTMZ1Z&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DcJ12T4h2TtRVRyAFbSJHb5NER4YXeW9SOl5EevA3TDhTOwgzKTh1cxx0Kr9iUkZmQapER5VXRvlEe=0zcahWbmlEOihDOrpUYvhTeWVkaaRDZohkejV0U2NUQsNHRIZmdpJ1chdTSQZWQP12M0o2KTh1KHV&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=wFmalJXa0ZHMxonaPZFe2B1U1J1TWZ2dJtWYoN1N4MWNXJDTTRTWtBTSXFXWDl2cyQHSpV2ZylFUrRGR5lXTyhXTLpmWkVXYip1VpBVepVzbRB3V2sSN11mMVlUba9mYvUUW2E0MmNXNvVDNlZkUptieWdDcItGS&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=kTxwEd51EZOZDOyJGNy52RJ1ESsB1U5d3MHZ0ZklkeVtyMNV0NDRHZ4NDMkdXZkZjVsRnSURVTCFmT=0zcxonUWt2QnFkSK5WMGl0ZC5WWBd3aB9WSBlkevU3T3RlcFN1dDZUQ3k0Lkp1LIZEaKlkW1Z2dzV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ya1NkTrFDMKVkQlVUezhzZ2lGd3lWSSZWWxJVY5QTaxgXeEJEMBB1S3kGNHhWUsJmdFpnb3B1SahFW=0zb40mW2hnM0l3YHdna4dDbXlmRJl2SSRHcBZlaGBzQxpUdy4maXJWSBBTNxYjMZx0YxRFb4UXWV9&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=4gkVZlXaZFjdxwGTnJmVYZVMRNkU09WRxU1Rw5UUCVTZhB3L6RENzBDNM9CaydFUZhWbyFGdSdHVthmbhZ2UrM3MjJmVF1Ec0Q0N38kR4JmRtZHR51UTEd0LFFHORJUT4g3YsZVRYZVNkJ1SHJlR3pGVqRnSJNFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=hJ2cQFXQwQmNqJHO0QmaGBjT6pWdBdjbPlUONpWTtN3cVpXSrNWeHllVWRzRoF2bzgnYypFUVN0dmBlQ0lFcuJkSpNnWJxmZNhFM1gkcJxkWTdUbFtUaGdlY3ljQ3N3bzEnbU9yMIhjY2lGUOJjNwNGVjRjRFNHS&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=qFjRvdHeEZTOWV3bmVHO20UajVTYrVUUzklSVh0TmVTNwMHaKd2KDJjT1QTNxV0avN0TptESuZ1a6JXRIlWbiZmUwglYZhnZtBVZpJFOZhFZEFlMYtiVlhWZFlXexFUTsFHbV9SU4hDOZNGNmhleHh0VaF2T4QnT&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=lSxZVO0c0YvVnV1J0SPJVa1oVTop3cux2R0wEVEFESqZ2YXB3LnpGdjBlS1N2S6J2UhZ2cvdUd210S=0zaQRXcWJjeYlGTyIVRJNnN0N1ZyxkcoVHV4l3YEJERoxGTo1UdJZVYP9yMr5GVDhHZkFVM4QXQwU&tablename=CJFDAUTO&dflag=pdfdown']"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Fetch each detail page in `links` and collect its PDF download href.\n",
    "# One HTMLSession is shared across all requests.\n",
    "session = HTMLSession()\n",
    "\n",
    "pdf_links=[]\n",
    "\n",
    "for url in links:\n",
    "    r = session.get(url)\n",
    "    # Select the href attribute of every element with id=\"pdfDown\" and keep the\n",
    "    # second match (index 1).\n",
    "    # NOTE(review): raises IndexError if a page yields fewer than two matches\n",
    "    # (e.g. no PDF link available) -- confirm why index 1 rather than 0.\n",
    "    pdf_link_xpath=r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "    pdf_links.append(pdf_link_xpath)\n",
    "# The collected hrefs are site-relative paths (see the displayed output).\n",
    "pdf_links"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['https://kns.cnki.net/kcms/download.aspx?filename=rYGVSFGZQhUTshVdVl2MiJXWLVVVZlVZ6dTdQhFNSdzMFRnS1p0TsxmNQN2NyIDZCJ3RWx0bQJlbWZ1YY1kbxZkSrFDVvRzSZF0KFRWRzQjQ3NWb4hXRPdFTwZjQycGVZpWa3M0Tv9iRL9yLUJ0QpVWRthzRutmR&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=P9kQZt0d3JVTnBnUolDej9iTZBleKV0ZO9GMZpWQ5pmRxQjbv5WR0QVb1EzTH9kSGRVVK9mURVXeSlWaPtCOlFkZ5pWdVtCTxgVW0NTOnZzQkNDcDVnaYp0NIZmdmBlNLpmWmlXQJ1Ec3o3TCRndhRTQXRkaCl0Z&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=xcDbhFHcLpHaLNWeadGU0cXMvdDT1lGM0IDbw9kb2BTSjJ0LDpHOVdkT61mVDpFbOBFZTt0QLZWUPZHcnpkWrMlYyMmMmp0dr5mYvlzcSNEaRVXMv9iUsJWS28mS2gDWhZVS2J2atJXYmVVTGxkM2gjTXRDcEp2L&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=a50YwI3UxR0VLBXSjRkclBzMMFVWiNGbVFzT0NmS1dHSPlDRnlXMykTUXRkQ1dTaZp2YOVndsFndpZ2cuZmRtt0SVBjVlB3QN9EUjFmMWRXeFh1USh0KjNzNORVWwk0bw92TxtSaCdDZLtUYlNkYrR2dyUEdJtmb&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=uNHTpRDd2cUcWplaOZ1R3Ynd502LzRWa3U0QrRDVppXczc2aLVVR2J2NvR1d2sUNFZzUpFlZtJ2TlNneo9SUwp3N4VzdLBTamRzKKZXOPlneuZHdwsmdkBjcMlnQURjSHdzMDd0QaRWYp5GOXBHNIB3Q2c1bRF2T&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=udEa1ZET0wkNSBjTxx2YJtWUkBleDtWdqlXdBlmb4M1dOJmeHZmZ2VDTQh3ctVWNXpEO4IUWO1GdHN2QHNDRVZWOvR2aWRTT3YGO4c1aqlTaLZ3LRp0T1YGMsJlR0dUb080RqZjUJZ2Mw8WVKBVYtJ0T5AjM1kGV&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=VFDMyk0Z0MHRNlnbMN3T4lTeTVHOmlDNTtiRPFGRBlkW1tSW4hHcBZ3dl9iQPp0aJp1LJhkQwhmcYFWTpZUYRFTT4NmN1F2bLN1VkVTSslEarcVS0g3KHdWd3pHN2Q2L0RXbYlHe4g1TyV3Z4czd2F1Z65WSHhFU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=vJXb6Vzd0MnaT9UN0Y1b3EHRkJDR2xEZSFWZRpUOih3ZOljUxcGSStyLv42aoNnYiZzVVpXdJJEWytEUHJmRwFkZBhFNLZDZKVTdLpWSsV2M4F0NQ90aQBXe1J2LNFDTmlFNWhUQlNkaxpnbQJ0TSV0K1MVdJpmN&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=CZlMWdlRzBnZx1maCl1YHd3QrZXMHVzNYd2RMdlWVNTQwVzZ1BXYMBnYYh0b6JFS5N3YrZFWKxGcuh1V2pmbwlje0pkQBxWbWRTdFdlbItiWkxkUrR2MHRETpVjQsVkZOVzYPB3YPpUYqdFUIFTM5J2LVl0MztWU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=YpFbktEWil0UMh1SRFkYN9kesRTSipUUFhWUKRDMmFEW0cGRuZkSYVGbygjN582RsBXMCFHSM9kQrt2Y2N1Sll1bRpGRll3QqVGbo9EU0JENuV0KNVka5hzLwoGTkpGUCNTO6ZkaEZTRF5mboRjU1EDUOlzNFJkR&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=htGe28kYx9iaro1QTNHTOR3dqRUczQVO5U0QHVzQsdTdF52VNRWUQ5mMnVkR3UXa2FmcldHbutUeJhWbwVnT6RDW0ZFcNNUMotWTohkTnljZzJmQwUFayBXMxFDR6tGOyo3U6RGVDt0LCN1YvYmYixEeztUdKZDO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=iZzYWR0bE52ZER0Qzkjb1YEWuR1LjR0Zm9yUVFUavhVOoFDbCRGVHl3UrtmTrcFb0o0SIJ1aqJUdwJ2RM5EcwEkQmx2cwIVRXdGdKNjQ2oXYFl3SBd3dBRjVQJkV2EHTyJ1bqFkVWh1NEdUa6lXcTtyUXhnRSdnR&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mNUMuh1ZvokQvkGZzRHdI5UZ3FTRx1URUBHTrQ0NMdDbCZVZIFESXdTRnVWThR0aYFGW20WVsZWRtdXTId2avZHe4RTeJh2LOdEe2JFa3NmMY10Kzs0dsNTYSp0R0lmWGd0ZMJje3UVYzN0ZVl2YrwkY5kkSjx0K&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=Nt2VRd3KohTa3FVboVTNyJVY0R3cFNDMENnVpJDS4NFNnRTdZlme1NjcOZkYwhVW44UOhhlTEh3aPpFUxNTckZGdu12duZEV5YzSvoXbvs0RuJmMoZmYLVHNSJTZpZkV3YXZP1EWzVmTrlXTYtkZWdGNhdjUil0M&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=0F2c4QncLZ3aNZlSH5mTzljcZR3dEVzdMN3byknMxgGSMZ1Z1VmTQdmdrMDWvN3KMV2YKRWcnRXaldlWj9yMFNEZnVlayNUQLVlTyI2VU1UOWlHTtdkTFllZ0gmSRJTYFlGMJtiUQpWZ3N2QxwmQuJlYaplezIFe&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=5NUczh2SGd1V1UFV5JUcZZGMqtmTjRVV4UnaTRHb5ckch9WSRRXVIplM2Y3d1onUSpWMG9kaHxkT5d0Y1NTUsN1VzFjepBTZuN1VHJ0VyQlUlJGc4dTYvBjdwcXNT5UMrtEMXZWQqF3UNlGUrIjMMdDRThVRlFGW&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=4JzYLdVU3cDV4JzTEhWNaR0d3V1b0ITekF1SUljdHljaYpWWKZEZvMkYvk3NuZkUqNDNYJXTJB3Z2RlaBpme4tkMRREZvNHbihGai9idSp3UaNmcVhUQB9SNpJGbudFd51GSylmYKRWN1xkYSR1NSt2d1MjMvEHS&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=TezNVO2wmM4kGM112KPZVd1UkSSNUdOx0LMZ2UqR1Sv50RxA1MKZXMh92SrpFeptkcv5EeKFWcy9Gc=0TQvBXdKZzTRl2bYFFbHZkMCJlUvVlNvFTOvNjdTJUZ2wGZm9CO0BlWppkS4hHdh1WWmd2NWZ1NYh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=RhXRil1Q4gGRVBjb38SOtFEZpNmMXpmVqtCOXZFTB50QBpXOwZmcOJzbHRkb19yMwEzdnRVYkZ1bRxmeXBFbxgWb0s2dvsmNiZ0S3RXaDp1L4MDSKlFdldFR0hlb4sEexdzMPZFcOZVMwFHeP1kRjlDOjFVZQJ0L&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mWyBHO08UbGlURGRFVXd0MvJnQ3FkdmhTdoJ3UzMXesxUexJURh10LlVjU2UFNBJkSz9GTmpHSNl3R=0TVEB1bVd2VPJXOxYnUMJXZXt2dh9yQEd1L2sWazljcNlTVFp1R4kkcZhUYsRDOQdDWr1WWCh2UhJ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=HRvJUVLR2TBVVc0NUZYpEWIhFZZVDbY9EatJTUNpHdxhkUpZ3dJpFUrwmQyF1VIFXTrZ3ZIVnRkZXU=0DN1UkUJd0ciVTRkZXazNza3QjdhJUQzcETmpGSQFWbslWU2ETe6tkd2glZkJVeklWaulEardTWHV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=GbDpEWRhEWWhjSK50chlHMyJTeXNkRWRkQSNERsVDRSBzRhZnM4Q0LnR2bx8iSLdTckllUChFUal0V=0DNzoGSX1EWvVmRrFlN6J3LINzKhxGW5glQ2Q1ZwUXeIVkWzomZIJFS24mNjVDeyADeSZ1T3MDMxt&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=utGclRHbZNle2czNiNER5BXZDVHOBx0VRZkejJVTsF1Yv8UZjlXUUBFajZFeSxUbGRzb3UWdkRlTwZ0ZDNHb4YHdwInM5d3Rwt0VDljeyxEOnB1UwgjS3tWZqpkYV9mYjRmdltmc0ImZUhUQKRDS1kHZZJ3T6JzL&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=hVmUxUEb0B3dZhHRXZ2YHB3LvFkbkB1VU9EO5hmeLd0VsxkcpFXZnd3N5gHUlN0LCZDZqJkZlVUWtFWbERkRzZXYl9ERRlzblVndSZkQhVETRp0N5F1TJ9kZkRnd5wmNwplbaljexFkR0JmQ2R2ZydDcm9iVaRzK&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ES1tGcwd2YwMUUQVDWkpnevYDbzxWTQNTdnRkSlljWGl0N5s0cFd2V3BzQEF2djN2SrZVUZhmcp5Gd=0TWIlkal10TTxWZ5IlZoZWNnlFd5MDNL50R21WUXdDOvoHV2k1KQd1RKlTVKZTcFhUZ1omYJZzQtl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1QGZkZrplQWFFbZNUTrknbTVkRZBHZ0YEbiJVcsN0YNJEW2EWSLV2LFllarZTNxkmbhdkS5J0VDh1d=0DMIVUO10WWEJGN1okbyVFbwQmdshTS3EWWvkFahdWd4wGeVlGOXt2V1knbMdGWOhHTP9CS5p1cxc&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FRUxmVDlHdll0Z0F2YnZDaRdGbn5WRQlFMw42ZVlVSZp1bwNkbPR2NNNFN2YVcHFHTiJWbCR2b6tGR=0zcvgEMvRFUwpGb1k2bkBjbmR0TyVWTrskNLZDT2kTT500NDNTOwUjN00EMzYkeC9yUwNVTqJzTBJ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=zQ6FlNYhFc0Njc0o2ZYVVUoVmVKNWVrYnU3FVbotmSsVnd1YDV1UkRwVjR38WdnhnZUVVZidXViV1R=0zYa1UYCN1UsFzaOp0Z2czQjFVTyQ0aORUdsR1U3o1crhTZL50QtBVTzAHaChWQDpXa3JVSOVnd1A&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=zQ6FlNYhFc0Njc0o2ZYVVUoVmVKNWVrYnU3FVbotmSsVnd1YDV1UkRwVjR38WdnhnZUVVZidXViV1R=0zYZpUYCN1UsFzaOp0Z2czQjFVTyQ0aORUdsR1U3o1crhTZL50QtBVTzAHaChWQDpXa3JVSOVnd1A&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=6pHW5BVNUFXT41GOLJUd3dlYC9GdwE2TJtWS3hzQsh0KnBDaBp3K1ZjZ1IDMphWOpxEU0BHUjpVbYhmTNd2SyVza5sUNvFHNmF3Y0s0SmlTV0gzQGd2cL12QYdzd1UEOr42LiZzUJB3MmBXcvV0LPFGdxYGSTdme&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=M5kaI9kdqVTVyp1VwsmYXdmN3gGSMtCTpx2SUlUNtVDb5xWVVZDaKRHMqpkVPZ3SVd3dMd3c3Z1YvV2VqRXR4EmZwBFS3VWeJZXS1NES3Z1KlNmNkxGOwgDNZN3UhRjNxxkSqF0Q2onYnZUc1tiaa9SW5MlY4RDO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=X5UOB9UdoZVOBpXNkNWR142VZZTWENlYOFGbLNTaQNUUSp0bCNzdtFEO2kDelRGdVZ3VwM0TZFVYFN2Za1kU34GTwgWYXpmTaZEVzF0Q2Ene5o2ROZWQupXaRF1d612MzhzaLdXQUJFSUZGR5MDTyZTVRF3d2MGd&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=pZmbON3dmRGNWhkao1ENoV2NV9SQvt2Z4cjTolXYrBTayg2ZIdnR4gXaxAjW2B3QGp1ROhVehJEdCdnb6J0SYV2VjFXN3Q2ZZpEToZ3YXR0dhNUWEJWa6ZUZ0lzQjtSNyUkdzFmM3IXRysSOwg0bzA3QTNUVVhnQ&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=zKvsCVONmYEZndjtUUCVkU3g2SptmWUpkZphlakpGdOFWajtWd0RnR1RUW0kzZrp3S4ElcCVVWkpVc=0zYNtEaoF1UmJVONJGNS9GOudFOpZkZDN3Kl9yRxATQx5kUmVTQHhzQM9mdvFUQvp3NZVWZw0WR5Q&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=EBHTEJGN0lXWGljbhFlUaJnYmJ3NFlFT2Uje4smYpVFeRdUaBNnRVh3RwJXeulkRSN3cJx2Y1hncaVHe0IHWQFjdxMnVolDOkJEZaZ1aPB1QRZzLDpWWqZDOUlEeqx0RBp3RKR3cJtkdRZ1Q3BXd2BTaz4ETGRVO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FFHN5l0MRtkNSpmc28iUOV0L5UVbXFTV1IUbOFzSvMWWyJGNTZFZodWVVFmew9yY5MHOwgkT3F2QWdER0lUb2InSy5EcSJVUVRWdWFWTQhTTapFbwMFMoJFaXp1MU92aWJDVNVlV5Q3Y3Yle3hmV3ZWWQhWT5ZFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=Wa55kcrs2cCFzVQpme1M0M1VTUDRHZMh3dKZXRGd0Tzg0TXVmaNp2Ms9yUHljR6ZnNDNnRXRHawJ3R=0zczNkSHFnQWdFMslWO5hkSjljTJNTQIhDbGRDSzo1Y2wUSk9icjd1RhlVeMZTaz4EaNpkayNVMjp&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=MlHO0UWNHV0bYVlVrcXO0lnY6lmaqp1NoBXZaJ1NCNTV5UXNmFGczh1TLVlR3kleVRTYl5UcZdletVkT6F3YhJUWPZTarhEO4Fjc3hjehRWVjFFViZ3UodTYTZUNFJ3VZl1Q5sCVWVGWBZ0SmtEcL1kd2l2dmZES&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=3N4okQ2MkRwxGcwoHRNpGdkZEZ5FXc0pXdDhHdwMWYQt0N2sieVVjbDh1coBFcDFXWTlGVah0SpFFV=0zd5NUTxFDeD1mVVpHTYR0ZvsSNZl2MPREbpFDNypGV0d3TL5Ue0MzaS9UYwYFMvZ3Mxl3K1MEUiB&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=3cyF2RwoHVDBTNZJlRwxWcGZmU4cDbwpEMY9UWaxUTr8keW9mUk5GUSxkWxoHNlNEZyQFTzNFeDJEW=0zZZRDcCtiVuxWUhp0bH5meR12RtZ2K1tWbOdGWYZjdwBXbKdmSkNWanpFd140RXVVZ0c1MMhjdOB&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=iF1LN92TvsWMLlFOjl2bVhFVuN3U1FVcYJHSHp0RrdkVkFHUI9SZ5MmcM1UdQhXTiVVNxh3d0RUS69EZhR0YVljTGZHcDlkTV9EVyYXZU5kWxEGcGZHWthkUVZmQaJEMJNlQoFWZ6dXUPJDMqZUTMljRrQHaK9We&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=6dEa5dDN1sCZkl0TstEdHZ0dyg0Q4IHM6N3dkt0Rp9mMGZFMvNHb3oUc5M1MLd0KGBVdJRUYXp3RYxkbrE0a5BnS0xETphFWrlTe3dHOxF0cVJHM0J2TUREaJV2RVJzcxR0NTh2TwIVR5JETZlzY6FUURBlTMZ1Z&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DcJ12T4h2TtRVRyAFbSJHb5NER4YXeW9SOl5EevA3TDhTOwgzKTh1cxx0Kr9iUkZmQapER5VXRvlEe=0zcahWbmlEOihDOrpUYvhTeWVkaaRDZohkejV0U2NUQsNHRIZmdpJ1chdTSQZWQP12M0o2KTh1KHV&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=wFmalJXa0ZHMxonaPZFe2B1U1J1TWZ2dJtWYoN1N4MWNXJDTTRTWtBTSXFXWDl2cyQHSpV2ZylFUrRGR5lXTyhXTLpmWkVXYip1VpBVepVzbRB3V2sSN11mMVlUba9mYvUUW2E0MmNXNvVDNlZkUptieWdDcItGS&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=kTxwEd51EZOZDOyJGNy52RJ1ESsB1U5d3MHZ0ZklkeVtyMNV0NDRHZ4NDMkdXZkZjVsRnSURVTCFmT=0zcxonUWt2QnFkSK5WMGl0ZC5WWBd3aB9WSBlkevU3T3RlcFN1dDZUQ3k0Lkp1LIZEaKlkW1Z2dzV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ya1NkTrFDMKVkQlVUezhzZ2lGd3lWSSZWWxJVY5QTaxgXeEJEMBB1S3kGNHhWUsJmdFpnb3B1SahFW=0zb40mW2hnM0l3YHdna4dDbXlmRJl2SSRHcBZlaGBzQxpUdy4maXJWSBBTNxYjMZx0YxRFb4UXWV9&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=4gkVZlXaZFjdxwGTnJmVYZVMRNkU09WRxU1Rw5UUCVTZhB3L6RENzBDNM9CaydFUZhWbyFGdSdHVthmbhZ2UrM3MjJmVF1Ec0Q0N38kR4JmRtZHR51UTEd0LFFHORJUT4g3YsZVRYZVNkJ1SHJlR3pGVqRnSJNFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=hJ2cQFXQwQmNqJHO0QmaGBjT6pWdBdjbPlUONpWTtN3cVpXSrNWeHllVWRzRoF2bzgnYypFUVN0dmBlQ0lFcuJkSpNnWJxmZNhFM1gkcJxkWTdUbFtUaGdlY3ljQ3N3bzEnbU9yMIhjY2lGUOJjNwNGVjRjRFNHS&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=qFjRvdHeEZTOWV3bmVHO20UajVTYrVUUzklSVh0TmVTNwMHaKd2KDJjT1QTNxV0avN0TptESuZ1a6JXRIlWbiZmUwglYZhnZtBVZpJFOZhFZEFlMYtiVlhWZFlXexFUTsFHbV9SU4hDOZNGNmhleHh0VaF2T4QnT&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=lSxZVO0c0YvVnV1J0SPJVa1oVTop3cux2R0wEVEFESqZ2YXB3LnpGdjBlS1N2S6J2UhZ2cvdUd210S=0zaQRXcWJjeYlGTyIVRJNnN0N1ZyxkcoVHV4l3YEJERoxGTo1UdJZVYP9yMr5GVDhHZkFVM4QXQwU&tablename=CJFDAUTO&dflag=pdfdown']"
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Full links: prepend the CNKI host to every relative download path\n",
    "pdf_href = [\n",
    "    'https://kns.cnki.net' + relative_path\n",
    "    for relative_path in pdf_links\n",
    "]\n",
    "pdf_href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>智能化测绘的基本问题与发展方向  网络首发</td>\n",
       "      <td>陈军; 刘万增; 武昊; Songnian Li; 闫利</td>\n",
       "      <td>测绘学报</td>\n",
       "      <td>2021-07-06 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>国土空间开发适宜性评价的理论、方法与技术应用  网络首发</td>\n",
       "      <td>刘小波;王玉宽;李明</td>\n",
       "      <td>地球信息科学学报</td>\n",
       "      <td>2021-07-06 15:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发</td>\n",
       "      <td>李燕云;王永明;周奇;李亦学;王振</td>\n",
       "      <td>复旦学报(医学版)</td>\n",
       "      <td>2021-07-06 15:53</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>铁路盾构隧道智能建造技术现状与展望  网络首发</td>\n",
       "      <td>陈丹; 刘喆; 刘建友; 房倩; 海路</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-07-06 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发</td>\n",
       "      <td>郑翔; 山茂峰</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-06 15:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>互联网旅游统计体系初探  网络首发</td>\n",
       "      <td>刘冰洁; 李倩; 赵彦云</td>\n",
       "      <td>统计与决策</td>\n",
       "      <td>2021-07-05 17:36</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>基于处方序列与处方序列对称分析的中药药物警戒  网络首发</td>\n",
       "      <td>吕健; 王连心; 谢雁鸣</td>\n",
       "      <td>中国中药杂志</td>\n",
       "      <td>2021-07-05 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>大数据金融：小微企业金融服务的创新与思考  网络首发</td>\n",
       "      <td>丁廉业</td>\n",
       "      <td>西南金融</td>\n",
       "      <td>2021-07-05 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>我国非银行支付适应性监管：基于鼓励金融创新、公平市场竞争与消费者保护的视角  网络首发</td>\n",
       "      <td>陈游</td>\n",
       "      <td>西南金融</td>\n",
       "      <td>2021-07-05 15:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>三支决策在工业大数据中的应用  网络首发</td>\n",
       "      <td>于洪; 杨雪梅</td>\n",
       "      <td>西北大学学报(自然科学版)</td>\n",
       "      <td>2021-07-05 14:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>大数据能力、服务链整合与政府智慧服务绩效关系研究  网络首发</td>\n",
       "      <td>张艾荣; 吕娜</td>\n",
       "      <td>软科学</td>\n",
       "      <td>2021-07-05 13:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据时代中国共产党的形象建构：挑战与应对  网络首发</td>\n",
       "      <td>苏玉波; 刘婷婷</td>\n",
       "      <td>西安交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-05 13:37</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>电子信息领域硕士研究生工程伦理课程建设  网络首发</td>\n",
       "      <td>周林娜; 常俊林; 代伟; 杨春雨</td>\n",
       "      <td>控制工程</td>\n",
       "      <td>2021-07-05 13:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>中国经济发展规律与理论研究关键科学问题  网络首发</td>\n",
       "      <td>刘元春; 任之光; 陈彦斌; 杨列勋; 刘作仪</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-05 11:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>中国科技情报事业回顾与展望：基于情报学理论的视角  网络首发</td>\n",
       "      <td>王琳; 赖茂生</td>\n",
       "      <td>中国图书馆学报</td>\n",
       "      <td>2021-07-05 11:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>基于地理大数据的省域休闲农业空间格局及其影响因素研究——以浙江省为例  网络首发</td>\n",
       "      <td>叶晗;吴博文;许红卫;干牧野;张晶</td>\n",
       "      <td>浙江农业学报</td>\n",
       "      <td>2021-07-05 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>基于靶向最大似然估计模型在高血压药物疗效评价中的应用</td>\n",
       "      <td>潘凤鸣;赵红玉;吴新莹;冯一平;侯庆振</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 09:15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例  网络首发</td>\n",
       "      <td>丁雄;蒋蔚;蒋静;胡跃华;武英</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 08:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例</td>\n",
       "      <td>丁雄;蒋蔚;蒋静;胡跃华;武英</td>\n",
       "      <td>中华疾病控制杂志</td>\n",
       "      <td>2021-07-05 08:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>计算机技术在储能系统中的应用研究</td>\n",
       "      <td>李骏; 杨雅志</td>\n",
       "      <td>储能科学与技术</td>\n",
       "      <td>2021-07-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>面向代码相似性检测的相似哈希改进方法</td>\n",
       "      <td>李玫;高庆;马森;张世琨;胡文蕙</td>\n",
       "      <td>软件学报</td>\n",
       "      <td>2021-07-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>国际大洋钻探科学数据的现状、特征及其汇编的科学意义  网络首发</td>\n",
       "      <td>马鹏飞;刘志飞;拓守廷;蒋璟鑫;许艺炜</td>\n",
       "      <td>地球科学进展</td>\n",
       "      <td>2021-07-02 15:58</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>大数据背景下档案信息服务体系构建方法探析</td>\n",
       "      <td>孔媛媛; 张舒; 王爱</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 09:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>数据赋能教育治理创新:内涵、机制与实践</td>\n",
       "      <td>张培; 夏海鹰</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>社交媒体大数据的教育应用研究:价值、路径与挑战</td>\n",
       "      <td>李彤彤; 李坦; 郭栩宁</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>大数据时代的科学实在论发展趋向及其特征</td>\n",
       "      <td>刘伟伟</td>\n",
       "      <td>自然辩证法通讯</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>健康医疗大数据公平问题研究</td>\n",
       "      <td>李晓洁; 丛亚丽</td>\n",
       "      <td>自然辩证法通讯</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>智能财务人才培养与浙江大学的探索  网络首发</td>\n",
       "      <td>陈俊; 董望</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 15:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>互联网平台滥用市场支配地位行为规制的困境与出路  网络首发</td>\n",
       "      <td>谭袁</td>\n",
       "      <td>法治研究</td>\n",
       "      <td>2021-07-01 15:17</td>\n",
       "      <td>NaN</td>\n",
       "      <td>27.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>铁路调度集中系统调车作业时间智能预测方法研究  网络首发</td>\n",
       "      <td>韩浪; 王壮锋; 张春德</td>\n",
       "      <td>铁道标准设计</td>\n",
       "      <td>2021-07-01 15:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>11.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>医院财务智能化转型路径探析  网络首发</td>\n",
       "      <td>刘波; 曾绍颖; 张晓玮; 李琼</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 11:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>数据开放共享与个人隐私保护对策研究——层次数据与算法问责</td>\n",
       "      <td>窦悦</td>\n",
       "      <td>现代情报</td>\n",
       "      <td>2021-07-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>全球主要生态退化区和研究热点区的空间分布与演变  网络首发</td>\n",
       "      <td>张云芝; 胡云锋; 韩月琪; 战胜</td>\n",
       "      <td>生态学报</td>\n",
       "      <td>2021-06-30 10:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>43.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例  网络首发</td>\n",
       "      <td>王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-30 09:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>43.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例</td>\n",
       "      <td>王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-30 09:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>地理综合研究方法的发展与思考  网络首发</td>\n",
       "      <td>闾国年;周成虎;林珲;陈旻;乐松山</td>\n",
       "      <td>科学通报</td>\n",
       "      <td>2021-06-30 09:12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>31.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>绿色理念下智慧零售创新发展路径</td>\n",
       "      <td>翟璇</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》</td>\n",
       "      <td>单浩耘</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>56.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>基于深度卷积生成对抗网络的缺失数据生成方法及其在剩余寿命预测中的应用  网络首发</td>\n",
       "      <td>张晟斐; 李天梅; 胡昌华; 杜党波; 司小胜</td>\n",
       "      <td>航空学报</td>\n",
       "      <td>2021-06-29 17:19</td>\n",
       "      <td>NaN</td>\n",
       "      <td>52.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>我国大数据审计研究综述——基于中文核心期刊文献研究  网络首发</td>\n",
       "      <td>王海洪; 吕登辉; 任美; 王婧; 王盈盈</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-29 17:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>170.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>我国大数据审计研究综述——基于中文核心期刊文献研究</td>\n",
       "      <td>王海洪; 吕登辉; 任美; 王婧; 王盈盈</td>\n",
       "      <td>会计之友</td>\n",
       "      <td>2021-06-29 17:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>智能化金融监管：模型框架、边缘约束和实践策略  网络首发</td>\n",
       "      <td>乔宇锋</td>\n",
       "      <td>南方金融</td>\n",
       "      <td>2021-06-29 17:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>119.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>“智能+”时代的现代文化产业体系：挑战与重塑</td>\n",
       "      <td>解学芳; 雷文宣</td>\n",
       "      <td>深圳大学学报(人文社会科学版)</td>\n",
       "      <td>2021-06-29 15:45</td>\n",
       "      <td>NaN</td>\n",
       "      <td>83.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>新时代发挥统计监督职能的思考</td>\n",
       "      <td>李金昌; 余卫</td>\n",
       "      <td>统计研究</td>\n",
       "      <td>2021-06-29 15:43</td>\n",
       "      <td>NaN</td>\n",
       "      <td>33.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>近20年长江经济带生态环境变化  网络首发</td>\n",
       "      <td>周权平;张澎彬;薛腾飞;姜月华;郭琳</td>\n",
       "      <td>中国地质</td>\n",
       "      <td>2021-06-29 14:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>科研大数据生态系统:构成要素及关联关系——以极地科研大数据为例  网络首发</td>\n",
       "      <td>丰佰恒; 佟泽华; 冯晓; 石江瀚; 孙晓彬</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-29 14:34</td>\n",
       "      <td>NaN</td>\n",
       "      <td>56.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>基于配网新形态下电费风险模型构建与应用  网络首发</td>\n",
       "      <td>戴璐平; 瞿青; 黄露; 潘晔</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2021-06-29 14:00</td>\n",
       "      <td>NaN</td>\n",
       "      <td>23.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>规模以下工业抽样设计研究</td>\n",
       "      <td>万舒晨</td>\n",
       "      <td>统计研究</td>\n",
       "      <td>2021-06-29 11:06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                           篇名  \\\n",
       "0            1                        智能化测绘的基本问题与发展方向  网络首发   \n",
       "1            2                 国土空间开发适宜性评价的理论、方法与技术应用  网络首发   \n",
       "2            3              基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发   \n",
       "3            4                      铁路盾构隧道智能建造技术现状与展望  网络首发   \n",
       "4            5         互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发   \n",
       "5            6                      森林生态站大数据快速存储与索引方法  网络首发   \n",
       "6            7                            互联网旅游统计体系初探  网络首发   \n",
       "7            8                 基于处方序列与处方序列对称分析的中药药物警戒  网络首发   \n",
       "8            9                   大数据金融：小微企业金融服务的创新与思考  网络首发   \n",
       "9           10  我国非银行支付适应性监管：基于鼓励金融创新、公平市场竞争与消费者保护的视角  网络首发   \n",
       "10          11                         三支决策在工业大数据中的应用  网络首发   \n",
       "11          12               大数据能力、服务链整合与政府智慧服务绩效关系研究  网络首发   \n",
       "12          13                  大数据时代中国共产党的形象建构：挑战与应对  网络首发   \n",
       "13          14                    电子信息领域硕士研究生工程伦理课程建设  网络首发   \n",
       "14          15                    中国经济发展规律与理论研究关键科学问题  网络首发   \n",
       "15          16               中国科技情报事业回顾与展望：基于情报学理论的视角  网络首发   \n",
       "16          17     基于地理大数据的省域休闲农业空间格局及其影响因素研究——以浙江省为例  网络首发   \n",
       "17          18                   基于靶向最大似然估计模型在高血压药物疗效评价中的应用   \n",
       "18          19          基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例  网络首发   \n",
       "19          20                基于健康大数据带状疱疹与抑郁症的关系——现实世界的研究实例   \n",
       "20          21                             计算机技术在储能系统中的应用研究   \n",
       "21          22                           面向代码相似性检测的相似哈希改进方法   \n",
       "22          23              国际大洋钻探科学数据的现状、特征及其汇编的科学意义  网络首发   \n",
       "23          24                   金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "24          25                         大数据背景下档案信息服务体系构建方法探析   \n",
       "25          26                          数据赋能教育治理创新:内涵、机制与实践   \n",
       "26          27                      社交媒体大数据的教育应用研究:价值、路径与挑战   \n",
       "27          28                          大数据时代的科学实在论发展趋向及其特征   \n",
       "28          29                                健康医疗大数据公平问题研究   \n",
       "29          30                       智能财务人才培养与浙江大学的探索  网络首发   \n",
       "30          31                互联网平台滥用市场支配地位行为规制的困境与出路  网络首发   \n",
       "31          32                 铁路调度集中系统调车作业时间智能预测方法研究  网络首发   \n",
       "32          33                          医院财务智能化转型路径探析  网络首发   \n",
       "33          34                 数据开放共享与个人隐私保护对策研究——层次数据与算法问责   \n",
       "34          35                全球主要生态退化区和研究热点区的空间分布与演变  网络首发   \n",
       "35          36        基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例  网络首发   \n",
       "36          37              基于知识图谱的审计智能专家模式设计与应用——以国网湖北电力为例   \n",
       "37          38                         地理综合研究方法的发展与思考  网络首发   \n",
       "38          39                              绿色理念下智慧零售创新发展路径   \n",
       "39          40           数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》   \n",
       "40          41     基于深度卷积生成对抗网络的缺失数据生成方法及其在剩余寿命预测中的应用  网络首发   \n",
       "41          42              我国大数据审计研究综述——基于中文核心期刊文献研究  网络首发   \n",
       "42          43                    我国大数据审计研究综述——基于中文核心期刊文献研究   \n",
       "43          44                 智能化金融监管：模型框架、边缘约束和实践策略  网络首发   \n",
       "44          45                       “智能+”时代的现代文化产业体系：挑战与重塑   \n",
       "45          46                               新时代发挥统计监督职能的思考   \n",
       "46          47                        近20年长江经济带生态环境变化  网络首发   \n",
       "47          48        科研大数据生态系统:构成要素及关联关系——以极地科研大数据为例  网络首发   \n",
       "48          49                    基于配网新形态下电费风险模型构建与应用  网络首发   \n",
       "49          50                                 规模以下工业抽样设计研究   \n",
       "\n",
       "                              作者               刊名              发表时间  被引  \\\n",
       "0   陈军; 刘万增; 武昊; Songnian Li; 闫利             测绘学报  2021-07-06 16:16 NaN   \n",
       "1                     刘小波;王玉宽;李明         地球信息科学学报  2021-07-06 15:54 NaN   \n",
       "2              李燕云;王永明;周奇;李亦学;王振        复旦学报(医学版)  2021-07-06 15:53 NaN   \n",
       "3            陈丹; 刘喆; 刘建友; 房倩; 海路        隧道建设(中英文)  2021-07-06 15:51 NaN   \n",
       "4                        郑翔; 山茂峰  北京交通大学学报(社会科学版)  2021-07-06 15:03 NaN   \n",
       "5         王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福           农业机械学报  2021-07-06 09:48 NaN   \n",
       "6                   刘冰洁; 李倩; 赵彦云            统计与决策  2021-07-05 17:36 NaN   \n",
       "7                   吕健; 王连心; 谢雁鸣           中国中药杂志  2021-07-05 15:51 NaN   \n",
       "8                            丁廉业             西南金融  2021-07-05 15:20 NaN   \n",
       "9                             陈游             西南金融  2021-07-05 15:20 NaN   \n",
       "10                       于洪; 杨雪梅    西北大学学报(自然科学版)  2021-07-05 14:19 NaN   \n",
       "11                       张艾荣; 吕娜              软科学  2021-07-05 13:38 NaN   \n",
       "12                      苏玉波; 刘婷婷  西安交通大学学报(社会科学版)  2021-07-05 13:37 NaN   \n",
       "13             周林娜; 常俊林; 代伟; 杨春雨             控制工程  2021-07-05 13:04 NaN   \n",
       "14       刘元春; 任之光; 陈彦斌; 杨列勋; 刘作仪           中国科学基金  2021-07-05 11:11 NaN   \n",
       "15                       王琳; 赖茂生          中国图书馆学报  2021-07-05 11:11 NaN   \n",
       "16             叶晗;吴博文;许红卫;干牧野;张晶           浙江农业学报  2021-07-05 11:09 NaN   \n",
       "17           潘凤鸣;赵红玉;吴新莹;冯一平;侯庆振         中华疾病控制杂志  2021-07-05 09:15 NaN   \n",
       "18               丁雄;蒋蔚;蒋静;胡跃华;武英         中华疾病控制杂志  2021-07-05 08:56 NaN   \n",
       "19               丁雄;蒋蔚;蒋静;胡跃华;武英         中华疾病控制杂志  2021-07-05 08:56 NaN   \n",
       "20                       李骏; 杨雅志          储能科学与技术        2021-07-05 NaN   \n",
       "21              李玫;高庆;马森;张世琨;胡文蕙             软件学报        2021-07-05 NaN   \n",
       "22           马鹏飞;刘志飞;拓守廷;蒋璟鑫;许艺炜           地球科学进展  2021-07-02 15:58 NaN   \n",
       "23                 陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN   \n",
       "24                   孔媛媛; 张舒; 王爱            档案与建设  2021-07-02 09:42 NaN   \n",
       "25                       张培; 夏海鹰           中国远程教育        2021-07-02 NaN   \n",
       "26                  李彤彤; 李坦; 郭栩宁           中国远程教育        2021-07-02 NaN   \n",
       "27                           刘伟伟          自然辩证法通讯        2021-07-02 NaN   \n",
       "28                      李晓洁; 丛亚丽          自然辩证法通讯        2021-07-02 NaN   \n",
       "29                        陈俊; 董望             财会月刊  2021-07-01 15:42 NaN   \n",
       "30                            谭袁             法治研究  2021-07-01 15:17 NaN   \n",
       "31                  韩浪; 王壮锋; 张春德           铁道标准设计  2021-07-01 15:09 NaN   \n",
       "32              刘波; 曾绍颖; 张晓玮; 李琼             财会月刊  2021-07-01 11:09 NaN   \n",
       "33                            窦悦             现代情报        2021-07-01 NaN   \n",
       "34             张云芝; 胡云锋; 韩月琪; 战胜             生态学报  2021-06-30 10:04 NaN   \n",
       "35         王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞             会计之友  2021-06-30 09:19 NaN   \n",
       "36         王向阳; 席斌; 胡璟懿; 匡尧; 刘云飞             会计之友  2021-06-30 09:19 NaN   \n",
       "37             闾国年;周成虎;林珲;陈旻;乐松山             科学通报  2021-06-30 09:12 NaN   \n",
       "38                            翟璇           商业经济研究        2021-06-30 NaN   \n",
       "39                           单浩耘           商业经济研究        2021-06-30 NaN   \n",
       "40       张晟斐; 李天梅; 胡昌华; 杜党波; 司小胜             航空学报  2021-06-29 17:19 NaN   \n",
       "41         王海洪; 吕登辉; 任美; 王婧; 王盈盈             会计之友  2021-06-29 17:09 NaN   \n",
       "42         王海洪; 吕登辉; 任美; 王婧; 王盈盈             会计之友  2021-06-29 17:09 NaN   \n",
       "43                           乔宇锋             南方金融  2021-06-29 17:04 NaN   \n",
       "44                      解学芳; 雷文宣  深圳大学学报(人文社会科学版)  2021-06-29 15:45 NaN   \n",
       "45                       李金昌; 余卫             统计研究  2021-06-29 15:43 NaN   \n",
       "46            周权平;张澎彬;薛腾飞;姜月华;郭琳             中国地质  2021-06-29 14:54 NaN   \n",
       "47        丰佰恒; 佟泽华; 冯晓; 石江瀚; 孙晓彬          情报理论与实践  2021-06-29 14:34 NaN   \n",
       "48               戴璐平; 瞿青; 黄露; 潘晔             中国电力  2021-06-29 14:00 NaN   \n",
       "49                           万舒晨             统计研究  2021-06-29 11:06 NaN   \n",
       "\n",
       "       下载  操作                                              详细页链接  \\\n",
       "0     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "5     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "6     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "7     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "8     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "9     NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "10    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "11    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "12    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "13    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "14    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "15    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "16    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "17    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "18    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "19    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "20    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "21    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "22    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "23    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "24    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "25    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "26    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "27    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "28    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "29   53.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "30   27.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "31   11.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "32   19.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "33    5.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "34   43.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "35   43.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "36    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "37   31.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "38   28.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "39   56.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "40   52.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "41  170.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "42    NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "43  119.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "44   83.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "45   33.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "46   58.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "47   56.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "48   23.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "49   28.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                              PDF下载链接  \n",
       "0   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "5   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "6   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "7   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "8   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "9   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "10  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "11  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "12  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "13  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "14  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "15  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "16  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "17  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "18  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "19  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "20  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "21  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "22  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "23  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "24  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "25  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "26  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "27  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "28  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "29  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "30  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "31  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "32  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "33  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "34  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "35  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "36  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "37  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "38  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "39  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "40  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "41  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "42  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "43  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "44  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "45  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "46  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "47  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "48  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "49  https://kns.cnki.net/kcms/download.aspx?filena...  "
      ]
     },
     "execution_count": 32,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Attach the PDF download links as an extra column of the first-page table.\n",
    "df_pdf_links = pd.DataFrame({'PDF下载链接': pdf_href})\n",
    "# Drop a previously attached copy first, so that re-running this cell does\n",
    "# not append a duplicate 'PDF下载链接' column to df_首页.\n",
    "df_首页 = pd.concat(\n",
    "    [df_首页.drop(columns='PDF下载链接', errors='ignore'), df_pdf_links],\n",
    "    axis=1,\n",
    ")\n",
    "df_首页"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 翻页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'下一页'"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Locate the 'next page' control and show its label to confirm it was found.\n",
    "# find_element(by, value) is used because the find_element_by_* helpers are\n",
    "# deprecated in Selenium 4 and removed in later 4.x releases.\n",
    "element = driver.find_element('id', 'PageNext')\n",
    "element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'1/120'"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the pager label (shown as 'current/total') to learn the upper limit.\n",
    "# find_element(by, value) replaces the deprecated find_element_by_xpath helper.\n",
    "element = driver.find_element('xpath', '//span[@class=\"countPageMark\"]')\n",
    "page_str = element.get_attribute('innerHTML')\n",
    "page_str"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16]"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# page_str looks like '1/120': current page / total number of result pages.\n",
    "page_int = page_str.split('/')\n",
    "current_page, total_pages = int(page_int[0]), int(page_int[1])\n",
    "\n",
    "# Number of further result pages to crawl.\n",
    "MAX_PAGES = 16\n",
    "\n",
    "# Every entry in `pages` is later turned into one click on 'next page', so the\n",
    "# list must never be longer than the number of pages left after the current one.\n",
    "pages = list(range(1, min(MAX_PAGES, total_pages - current_page) + 1))\n",
    "pages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [],
   "source": [
    "import time"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\t2\t3\t4\t5\t6\t7\t8\t9\t10\t11\t12\t13\t14\t15\t16\t"
     ]
    }
   ],
   "source": [
    "root_group = []      # parsed tree (fromstring) of every captured result page\n",
    "表格_html = dict()    # value from `pages` -> innerHTML of that page's gridTable\n",
    "\n",
    "# Module-level placeholders kept from the original cell; page_process assigns\n",
    "# only its own local variables and never writes to these two names.\n",
    "main_content = \"\"\n",
    "element = None\n",
    "\n",
    "def page_process(pages, wait_seconds=15):\n",
    "    \"\"\"Click through CNKI result pages and collect their HTML.\n",
    "\n",
    "    For every entry in ``pages`` the 'next page' control is clicked once and\n",
    "    the function sleeps for ``wait_seconds`` so the new results can load.\n",
    "    The page is then captured in two forms: the parsed page source is\n",
    "    appended to the module-level ``root_group`` and the innerHTML of the\n",
    "    ``gridTable`` element is stored in the module-level ``表格_html`` under\n",
    "    the loop value.\n",
    "\n",
    "    Because the click happens before the capture, the page that is open\n",
    "    when the function starts is not captured here.\n",
    "\n",
    "    Args:\n",
    "        pages: iterable of keys; one 'next page' click is made per entry.\n",
    "        wait_seconds: pause after each click, in seconds. Defaults to 15,\n",
    "            the value that used to be hard-coded.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        print(p, end='\\t')\n",
    "        # find_element(by, value) replaces the deprecated find_element_by_id.\n",
    "        driver.find_element('id', 'PageNext').click()\n",
    "        time.sleep(wait_seconds)\n",
    "\n",
    "        # Full page, parsed so that links can be extracted with XPath later.\n",
    "        root_group.append(fromstring(driver.page_source))\n",
    "\n",
    "        # Raw markup of the result grid, kept for pd.read_html later.\n",
    "        grid = driver.find_element('id', 'gridTable')\n",
    "        表格_html[p] = grid.get_attribute('innerHTML')\n",
    "\n",
    "page_process(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>html_snippets</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        html_snippets\n",
       "1   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "2   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "3   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "4   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "5   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "6   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "7   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "8   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "9   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "10  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "11  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "12  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "13  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "14  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "15  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "16  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ..."
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# One row per captured page: the index is the page key, the single column\n",
    "# holds the raw gridTable markup stored for that key.\n",
    "df = pd.Series(表格_html, name=\"html_snippets\").to_frame()\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>2020中国情报学年会暨情报学与情报工作发展论坛纪要  网络首发</td>\n",
       "      <td>曹树金; 王雅琪; 赵浜; 卓伊玲</td>\n",
       "      <td>图书情报知识</td>\n",
       "      <td>2021-06-29 11:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>78.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>能源-交通-信息三网融合发展的需求、形态及关键技术  网络首发</td>\n",
       "      <td>何正友; 向悦萍; 廖凯; 杨健维</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-06-28 16:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>81.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>平台视域下全国居民疫苗接种的认知、意愿及影响要素——基于五大互联网平台的舆情大数据分析  网络首发</td>\n",
       "      <td>喻国明; 杨雅; 陈雪娇</td>\n",
       "      <td>新闻界</td>\n",
       "      <td>2021-06-28 15:33</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>健康医疗大数据背景下医院管理的思路、难点及对策</td>\n",
       "      <td>姚德明;翟晓辉;梅翠竹;王栋;张涛</td>\n",
       "      <td>中国医院</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>86.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>大型三甲医院建立数据驱动的科研项目服务模式实践与探索</td>\n",
       "      <td>孙雅婧;李春漾;杨晓妍;辜永红;张伟</td>\n",
       "      <td>中国医院</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>846</td>\n",
       "      <td>基于并行化K-means的综合能源服务客户识别</td>\n",
       "      <td>沈子垚; 袁晓玲</td>\n",
       "      <td>电力工程技术</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>76.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>847</td>\n",
       "      <td>学科想象与理论生长——兼论计算教育学的错觉</td>\n",
       "      <td>吴刚</td>\n",
       "      <td>教育研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>2.0</td>\n",
       "      <td>315.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>848</td>\n",
       "      <td>我科学家研制成功新型可编程光量子计算芯片</td>\n",
       "      <td>NaN</td>\n",
       "      <td>机床与液压</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>849</td>\n",
       "      <td>高素质专业化审计队伍建设研究</td>\n",
       "      <td>上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>850</td>\n",
       "      <td>粤港澳大湾区大数据审计队伍建设研究</td>\n",
       "      <td>广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>198.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                                 篇名  \\\n",
       "0            51                   2020中国情报学年会暨情报学与情报工作发展论坛纪要  网络首发   \n",
       "1            52                    能源-交通-信息三网融合发展的需求、形态及关键技术  网络首发   \n",
       "2            53  平台视域下全国居民疫苗接种的认知、意愿及影响要素——基于五大互联网平台的舆情大数据分析  网络首发   \n",
       "3            54                            健康医疗大数据背景下医院管理的思路、难点及对策   \n",
       "4            55                         大型三甲医院建立数据驱动的科研项目服务模式实践与探索   \n",
       "..          ...                                                ...   \n",
       "795         846                            基于并行化K-means的综合能源服务客户识别   \n",
       "796         847                              学科想象与理论生长——兼论计算教育学的错觉   \n",
       "797         848                               我科学家研制成功新型可编程光量子计算芯片   \n",
       "798         849                                     高素质专业化审计队伍建设研究   \n",
       "799         850                                  粤港澳大湾区大数据审计队伍建设研究   \n",
       "\n",
       "                               作者       刊名              发表时间   被引     下载  操作  \n",
       "0               曹树金; 王雅琪; 赵浜; 卓伊玲   图书情报知识  2021-06-29 11:04  NaN   78.0  下载  \n",
       "1               何正友; 向悦萍; 廖凯; 杨健维  电力系统自动化  2021-06-28 16:32  NaN   81.0  下载  \n",
       "2                    喻国明; 杨雅; 陈雪娇      新闻界  2021-06-28 15:33  NaN  186.0  下载  \n",
       "3               姚德明;翟晓辉;梅翠竹;王栋;张涛     中国医院        2021-06-28  NaN   86.0  下载  \n",
       "4              孙雅婧;李春漾;杨晓妍;辜永红;张伟     中国医院        2021-06-28  NaN   29.0  下载  \n",
       "..                            ...      ...               ...  ...    ...  ..  \n",
       "795                      沈子垚; 袁晓玲   电力工程技术        2021-03-28  NaN   76.0  下载  \n",
       "796                            吴刚     教育研究        2021-03-28  2.0  315.0  下载  \n",
       "797                           NaN    机床与液压        2021-03-28  NaN   54.0  下载  \n",
       "798  上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏     审计研究        2021-03-28  NaN  220.0  下载  \n",
       "799      广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩     审计研究        2021-03-28  NaN  198.0  下载  \n",
       "\n",
       "[800 rows x 8 columns]"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from io import StringIO\n",
    "\n",
    "# Parse the grid markup captured for each page and stack the tables.\n",
    "l_df = []\n",
    "for p in pages:\n",
    "    # Wrap the markup in StringIO: passing a literal HTML string to\n",
    "    # pd.read_html is deprecated in recent pandas releases.\n",
    "    表格 = pd.read_html(StringIO(表格_html[p]))[0]\n",
    "    l_df.append(表格)\n",
    "df_url_out = pd.concat(l_df).reset_index(drop=True)\n",
    "df_url_out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Detail-page links: hrefs found in the second column of every captured grid.\n",
    "href_group = []\n",
    "\n",
    "for root in root_group:\n",
    "    href = root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')\n",
    "    # Flatten while collecting, so this works for any number of captured pages\n",
    "    # instead of exactly the 16 that used to be concatenated by hand.\n",
    "    href_group.extend(href)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "..                                                 ...\n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "\n",
       "[800 rows x 1 columns]"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Apply correct() to every collected href and keep the results, in order,\n",
    "# as a single-column DataFrame.\n",
    "href_group_correct = list(map(correct, href_group))\n",
    "df_link = pd.DataFrame({'详细页链接': href_group_correct})\n",
    "df_link"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "20\n",
      "21\n",
      "22\n",
      "23\n",
      "24\n",
      "25\n",
      "26\n",
      "27\n",
      "28\n",
      "29\n",
      "30\n",
      "31\n",
      "32\n",
      "33\n",
      "34\n",
      "35\n",
      "36\n",
      "37\n",
      "38\n",
      "39\n",
      "40\n",
      "41\n",
      "42\n",
      "43\n",
      "44\n",
      "45\n",
      "46\n",
      "47\n",
      "48\n",
      "49\n",
      "50\n",
      "51\n",
      "52\n",
      "53\n",
      "54\n",
      "55\n",
      "56\n",
      "57\n",
      "58\n",
      "59\n",
      "60\n",
      "61\n",
      "62\n",
      "63\n",
      "64\n",
      "65\n",
      "66\n",
      "67\n",
      "68\n",
      "69\n",
      "70\n",
      "71\n",
      "72\n",
      "73\n",
      "74\n",
      "75\n",
      "76\n",
      "77\n",
      "78\n",
      "79\n",
      "80\n",
      "81\n",
      "82\n",
      "83\n",
      "84\n",
      "85\n",
      "86\n",
      "87\n",
      "88\n",
      "89\n",
      "90\n",
      "91\n",
      "92\n",
      "93\n",
      "94\n",
      "95\n",
      "96\n",
      "97\n",
      "98\n",
      "99\n",
      "100\n",
      "101\n",
      "102\n",
      "103\n",
      "104\n",
      "105\n",
      "106\n",
      "107\n",
      "108\n",
      "109\n",
      "110\n",
      "111\n",
      "112\n",
      "113\n",
      "114\n",
      "115\n",
      "116\n",
      "117\n",
      "118\n",
      "119\n",
      "120\n",
      "121\n",
      "122\n",
      "123\n",
      "124\n",
      "125\n",
      "126\n",
      "127\n",
      "128\n",
      "129\n",
      "130\n",
      "131\n",
      "132\n",
      "133\n",
      "134\n",
      "135\n",
      "136\n",
      "137\n",
      "138\n",
      "139\n",
      "140\n",
      "141\n",
      "142\n",
      "143\n",
      "144\n",
      "145\n",
      "146\n",
      "147\n",
      "148\n",
      "149\n",
      "150\n",
      "151\n",
      "152\n",
      "153\n",
      "154\n",
      "155\n",
      "156\n",
      "157\n",
      "158\n",
      "159\n",
      "160\n",
      "161\n",
      "162\n",
      "163\n",
      "164\n",
      "165\n",
      "166\n",
      "167\n",
      "168\n",
      "169\n",
      "170\n",
      "171\n",
      "172\n",
      "173\n",
      "174\n",
      "175\n",
      "176\n",
      "177\n",
      "178\n",
      "179\n",
      "180\n",
      "181\n",
      "182\n",
      "183\n",
      "184\n",
      "185\n",
      "186\n",
      "187\n",
      "188\n",
      "189\n",
      "190\n",
      "191\n",
      "192\n",
      "193\n",
      "194\n",
      "195\n",
      "196\n",
      "197\n",
      "198\n",
      "199\n",
      "200\n",
      "201\n",
      "202\n",
      "203\n",
      "204\n",
      "205\n",
      "206\n",
      "207\n",
      "208\n",
      "209\n",
      "210\n",
      "211\n",
      "212\n",
      "213\n",
      "214\n",
      "215\n",
      "216\n",
      "217\n",
      "218\n",
      "219\n",
      "220\n",
      "221\n",
      "222\n",
      "223\n",
      "224\n",
      "225\n",
      "226\n",
      "227\n",
      "228\n",
      "229\n",
      "230\n",
      "231\n",
      "232\n",
      "233\n",
      "234\n",
      "235\n",
      "236\n",
      "237\n",
      "238\n",
      "239\n",
      "240\n",
      "241\n",
      "242\n",
      "243\n",
      "244\n",
      "245\n",
      "246\n",
      "247\n",
      "248\n",
      "249\n",
      "250\n",
      "251\n",
      "252\n",
      "253\n",
      "254\n",
      "255\n",
      "256\n",
      "257\n",
      "258\n",
      "259\n",
      "260\n",
      "261\n",
      "262\n",
      "263\n",
      "264\n",
      "265\n",
      "266\n",
      "267\n",
      "268\n",
      "269\n",
      "270\n",
      "271\n",
      "272\n",
      "273\n",
      "274\n",
      "275\n",
      "276\n",
      "277\n",
      "278\n",
      "279\n",
      "280\n",
      "281\n",
      "282\n",
      "283\n",
      "284\n",
      "285\n",
      "286\n",
      "287\n",
      "288\n",
      "289\n",
      "290\n",
      "291\n",
      "292\n",
      "293\n",
      "294\n",
      "295\n",
      "296\n",
      "297\n",
      "298\n",
      "299\n",
      "300\n",
      "301\n",
      "302\n",
      "303\n",
      "304\n",
      "305\n",
      "306\n",
      "307\n",
      "308\n",
      "309\n",
      "310\n",
      "311\n",
      "312\n",
      "313\n",
      "314\n",
      "315\n",
      "316\n",
      "317\n",
      "318\n",
      "319\n",
      "320\n",
      "321\n",
      "322\n",
      "323\n",
      "324\n",
      "325\n",
      "326\n",
      "327\n",
      "328\n",
      "329\n",
      "330\n",
      "331\n",
      "332\n",
      "333\n",
      "334\n",
      "335\n",
      "336\n",
      "337\n",
      "338\n",
      "339\n",
      "340\n",
      "341\n",
      "342\n",
      "343\n",
      "344\n",
      "345\n",
      "346\n",
      "347\n",
      "348\n",
      "349\n",
      "350\n",
      "351\n",
      "352\n",
      "353\n",
      "354\n",
      "355\n",
      "356\n",
      "357\n",
      "358\n",
      "359\n",
      "360\n",
      "361\n",
      "362\n",
      "363\n",
      "364\n",
      "365\n",
      "366\n",
      "367\n",
      "368\n",
      "369\n",
      "370\n",
      "371\n",
      "372\n",
      "373\n",
      "374\n",
      "375\n",
      "376\n",
      "377\n",
      "378\n",
      "379\n",
      "380\n",
      "381\n",
      "382\n",
      "383\n",
      "384\n",
      "385\n",
      "386\n",
      "387\n",
      "388\n",
      "389\n",
      "390\n",
      "391\n",
      "392\n",
      "393\n",
      "394\n",
      "395\n",
      "396\n",
      "397\n",
      "398\n",
      "399\n",
      "400\n",
      "401\n",
      "402\n",
      "403\n",
      "404\n",
      "405\n",
      "406\n",
      "407\n",
      "408\n",
      "409\n",
      "410\n",
      "411\n",
      "412\n",
      "413\n",
      "414\n",
      "415\n",
      "416\n",
      "417\n",
      "418\n",
      "419\n",
      "420\n",
      "421\n",
      "422\n",
      "423\n",
      "424\n",
      "425\n",
      "426\n",
      "427\n",
      "428\n",
      "429\n",
      "430\n",
      "431\n",
      "432\n",
      "433\n",
      "434\n",
      "435\n",
      "436\n",
      "437\n",
      "438\n",
      "439\n",
      "440\n",
      "441\n",
      "442\n",
      "443\n",
      "444\n",
      "445\n",
      "446\n",
      "447\n",
      "448\n",
      "449\n",
      "450\n",
      "451\n",
      "452\n",
      "453\n",
      "454\n",
      "455\n",
      "456\n",
      "457\n",
      "458\n",
      "459\n",
      "460\n",
      "461\n",
      "462\n",
      "463\n",
      "464\n",
      "465\n",
      "466\n",
      "467\n",
      "468\n",
      "469\n",
      "470\n",
      "471\n",
      "472\n",
      "473\n",
      "474\n",
      "475\n",
      "476\n",
      "477\n",
      "478\n",
      "479\n",
      "480\n",
      "481\n",
      "482\n",
      "483\n",
      "484\n",
      "485\n",
      "486\n",
      "487\n",
      "488\n",
      "489\n",
      "490\n",
      "491\n",
      "492\n",
      "493\n",
      "494\n",
      "495\n",
      "496\n",
      "497\n",
      "498\n",
      "499\n",
      "500\n",
      "501\n",
      "502\n",
      "503\n",
      "504\n",
      "505\n",
      "506\n",
      "507\n",
      "508\n",
      "509\n",
      "510\n",
      "511\n",
      "512\n",
      "513\n",
      "514\n",
      "515\n",
      "516\n",
      "517\n",
      "518\n",
      "519\n",
      "520\n",
      "521\n",
      "522\n",
      "523\n",
      "524\n",
      "525\n",
      "526\n",
      "527\n",
      "528\n",
      "529\n",
      "530\n",
      "531\n",
      "532\n",
      "533\n",
      "534\n",
      "535\n",
      "536\n",
      "537\n",
      "538\n",
      "539\n",
      "540\n",
      "541\n",
      "542\n",
      "543\n",
      "544\n",
      "545\n",
      "546\n",
      "547\n",
      "548\n",
      "549\n",
      "550\n",
      "551\n",
      "552\n",
      "553\n",
      "554\n",
      "555\n",
      "556\n",
      "557\n",
      "558\n",
      "559\n",
      "560\n",
      "561\n",
      "562\n",
      "563\n",
      "564\n",
      "565\n",
      "566\n",
      "567\n",
      "568\n",
      "569\n",
      "570\n",
      "571\n",
      "572\n",
      "573\n",
      "574\n",
      "575\n",
      "576\n",
      "577\n",
      "578\n",
      "579\n",
      "580\n",
      "581\n",
      "582\n",
      "583\n",
      "584\n",
      "585\n",
      "586\n",
      "587\n",
      "588\n",
      "589\n",
      "590\n",
      "591\n",
      "592\n",
      "593\n",
      "594\n",
      "595\n",
      "596\n",
      "597\n",
      "598\n",
      "599\n",
      "600\n",
      "601\n",
      "602\n",
      "603\n",
      "604\n",
      "605\n",
      "606\n",
      "607\n",
      "608\n",
      "609\n",
      "610\n",
      "611\n",
      "612\n",
      "613\n",
      "614\n",
      "615\n",
      "616\n",
      "617\n",
      "618\n",
      "619\n",
      "620\n",
      "621\n",
      "622\n",
      "623\n",
      "624\n",
      "625\n",
      "626\n",
      "627\n",
      "628\n",
      "629\n",
      "630\n",
      "631\n",
      "632\n",
      "633\n",
      "634\n",
      "635\n",
      "636\n",
      "637\n",
      "638\n",
      "639\n",
      "640\n",
      "641\n",
      "642\n",
      "643\n",
      "644\n",
      "645\n",
      "646\n",
      "647\n",
      "648\n",
      "649\n",
      "650\n",
      "651\n",
      "652\n",
      "653\n",
      "654\n",
      "655\n",
      "656\n",
      "657\n",
      "658\n",
      "659\n",
      "660\n",
      "661\n",
      "662\n",
      "663\n",
      "664\n",
      "665\n",
      "666\n",
      "667\n",
      "668\n",
      "669\n",
      "670\n",
      "671\n",
      "672\n",
      "673\n",
      "674\n",
      "675\n",
      "676\n",
      "677\n",
      "678\n",
      "679\n",
      "680\n",
      "681\n",
      "682\n",
      "683\n",
      "684\n",
      "685\n",
      "686\n",
      "687\n",
      "688\n",
      "689\n",
      "690\n",
      "691\n",
      "692\n",
      "693\n",
      "694\n",
      "695\n",
      "696\n",
      "697\n",
      "698\n",
      "699\n",
      "700\n",
      "701\n",
      "702\n",
      "703\n",
      "704\n",
      "705\n",
      "706\n",
      "707\n",
      "708\n",
      "709\n",
      "710\n",
      "711\n",
      "712\n",
      "713\n",
      "714\n",
      "715\n",
      "716\n",
      "717\n",
      "718\n",
      "719\n",
      "720\n",
      "721\n",
      "722\n",
      "723\n",
      "724\n",
      "725\n",
      "726\n",
      "727\n",
      "728\n",
      "729\n",
      "730\n",
      "731\n",
      "732\n",
      "733\n",
      "734\n",
      "735\n",
      "736\n",
      "737\n",
      "738\n",
      "739\n",
      "740\n",
      "741\n",
      "742\n",
      "743\n",
      "744\n",
      "745\n",
      "746\n",
      "747\n",
      "748\n",
      "749\n",
      "750\n",
      "751\n",
      "752\n",
      "753\n",
      "754\n",
      "755\n",
      "756\n",
      "757\n",
      "758\n",
      "759\n",
      "760\n",
      "761\n",
      "762\n",
      "763\n",
      "764\n",
      "765\n",
      "766\n",
      "767\n",
      "768\n",
      "769\n",
      "770\n",
      "771\n",
      "772\n",
      "773\n",
      "774\n",
      "775\n",
      "776\n",
      "777\n",
      "778\n",
      "779\n",
      "780\n",
      "781\n",
      "782\n",
      "783\n",
      "784\n",
      "785\n",
      "786\n",
      "787\n",
      "788\n",
      "789\n",
      "790\n",
      "791\n",
      "792\n",
      "793\n",
      "794\n",
      "795\n",
      "796\n",
      "797\n",
      "798\n",
      "799\n",
      "800\n"
     ]
    }
   ],
   "source": [
    "# PDF download links: request each detail page and read its PDF download href.\n",
    "# NOTE: pages that fail are skipped, so pdf_links can end up shorter than\n",
    "# href_group_correct; inspect pdf_link_failures before pairing the two by position.\n",
    "pdf_links = []\n",
    "pdf_link_failures = []  # (url, exception) for every page that yielded no link\n",
    "link_num = 0\n",
    "\n",
    "for url in href_group_correct:\n",
    "    try:\n",
    "        r = session.get(url)\n",
    "        # [1] takes the second node matched by id=\"pdfDown\"; a page with fewer\n",
    "        # matches raises IndexError and is recorded as a failure below.\n",
    "        pdf_link_xpath = r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "    except Exception as exc:\n",
    "        # Best-effort scrape: remember the failure and move on. Catching Exception\n",
    "        # (not a bare except) lets a kernel interrupt / Ctrl-C stop the loop.\n",
    "        pdf_link_failures.append((url, exc))\n",
    "        print('failed:', url, repr(exc))\n",
    "    else:\n",
    "        pdf_links.append(pdf_link_xpath)\n",
    "        link_num += 1\n",
    "        print(link_num)\n",
    "    # Throttle after every request, including failed ones.\n",
    "    time.sleep(1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                               PDF下载链接\n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "..                                                 ...\n",
       "795  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "796  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "797  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "798  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "799  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "\n",
       "[800 rows x 1 columns]"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Prefix each scraped download href with the site origin, then wrap the\n",
    "# resulting URLs in a single-column DataFrame.\n",
    "pdf_links_correct = []\n",
    "for link in pdf_links:\n",
    "    pdf_links_correct.append('https://kns.cnki.net' + link)\n",
    "\n",
    "df_pdf_download = pd.DataFrame({'PDF下载链接': pdf_links_correct})\n",
    "df_pdf_download"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "795  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "796  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "797  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "798  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "799  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[800 rows x 2 columns]"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Put the detail-page links and the PDF links side by side. concat along the\n",
    "# columns aligns on the row index, so row i of one frame is paired with row i\n",
    "# of the other.\n",
    "df_总 = pd.concat(objs=[df_link, df_pdf_download], axis='columns')\n",
    "df_总"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>2020中国情报学年会暨情报学与情报工作发展论坛纪要  网络首发</td>\n",
       "      <td>曹树金; 王雅琪; 赵浜; 卓伊玲</td>\n",
       "      <td>图书情报知识</td>\n",
       "      <td>2021-06-29 11:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>78.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>能源-交通-信息三网融合发展的需求、形态及关键技术  网络首发</td>\n",
       "      <td>何正友; 向悦萍; 廖凯; 杨健维</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-06-28 16:32</td>\n",
       "      <td>NaN</td>\n",
       "      <td>81.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>平台视域下全国居民疫苗接种的认知、意愿及影响要素——基于五大互联网平台的舆情大数据分析  网络首发</td>\n",
       "      <td>喻国明; 杨雅; 陈雪娇</td>\n",
       "      <td>新闻界</td>\n",
       "      <td>2021-06-28 15:33</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>健康医疗大数据背景下医院管理的思路、难点及对策</td>\n",
       "      <td>姚德明;翟晓辉;梅翠竹;王栋;张涛</td>\n",
       "      <td>中国医院</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>86.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>大型三甲医院建立数据驱动的科研项目服务模式实践与探索</td>\n",
       "      <td>孙雅婧;李春漾;杨晓妍;辜永红;张伟</td>\n",
       "      <td>中国医院</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>846</td>\n",
       "      <td>基于并行化K-means的综合能源服务客户识别</td>\n",
       "      <td>沈子垚; 袁晓玲</td>\n",
       "      <td>电力工程技术</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>76.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>847</td>\n",
       "      <td>学科想象与理论生长——兼论计算教育学的错觉</td>\n",
       "      <td>吴刚</td>\n",
       "      <td>教育研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>2.0</td>\n",
       "      <td>315.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>848</td>\n",
       "      <td>我科学家研制成功新型可编程光量子计算芯片</td>\n",
       "      <td>NaN</td>\n",
       "      <td>机床与液压</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>849</td>\n",
       "      <td>高素质专业化审计队伍建设研究</td>\n",
       "      <td>上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>850</td>\n",
       "      <td>粤港澳大湾区大数据审计队伍建设研究</td>\n",
       "      <td>广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>198.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                                 篇名  \\\n",
       "0            51                   2020中国情报学年会暨情报学与情报工作发展论坛纪要  网络首发   \n",
       "1            52                    能源-交通-信息三网融合发展的需求、形态及关键技术  网络首发   \n",
       "2            53  平台视域下全国居民疫苗接种的认知、意愿及影响要素——基于五大互联网平台的舆情大数据分析  网络首发   \n",
       "3            54                            健康医疗大数据背景下医院管理的思路、难点及对策   \n",
       "4            55                         大型三甲医院建立数据驱动的科研项目服务模式实践与探索   \n",
       "..          ...                                                ...   \n",
       "795         846                            基于并行化K-means的综合能源服务客户识别   \n",
       "796         847                              学科想象与理论生长——兼论计算教育学的错觉   \n",
       "797         848                               我科学家研制成功新型可编程光量子计算芯片   \n",
       "798         849                                     高素质专业化审计队伍建设研究   \n",
       "799         850                                  粤港澳大湾区大数据审计队伍建设研究   \n",
       "\n",
       "                               作者       刊名              发表时间   被引     下载  操作  \\\n",
       "0               曹树金; 王雅琪; 赵浜; 卓伊玲   图书情报知识  2021-06-29 11:04  NaN   78.0  下载   \n",
       "1               何正友; 向悦萍; 廖凯; 杨健维  电力系统自动化  2021-06-28 16:32  NaN   81.0  下载   \n",
       "2                    喻国明; 杨雅; 陈雪娇      新闻界  2021-06-28 15:33  NaN  186.0  下载   \n",
       "3               姚德明;翟晓辉;梅翠竹;王栋;张涛     中国医院        2021-06-28  NaN   86.0  下载   \n",
       "4              孙雅婧;李春漾;杨晓妍;辜永红;张伟     中国医院        2021-06-28  NaN   29.0  下载   \n",
       "..                            ...      ...               ...  ...    ...  ..   \n",
       "795                      沈子垚; 袁晓玲   电力工程技术        2021-03-28  NaN   76.0  下载   \n",
       "796                            吴刚     教育研究        2021-03-28  2.0  315.0  下载   \n",
       "797                           NaN    机床与液压        2021-03-28  NaN   54.0  下载   \n",
       "798  上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏     审计研究        2021-03-28  NaN  220.0  下载   \n",
       "799      广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩     审计研究        2021-03-28  NaN  198.0  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "795  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "796  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "797  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "798  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "799  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[800 rows x 10 columns]"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Place the two frames side by side; pandas aligns the rows on their index labels.\n",
    "df_合并 = pd.concat([df_url_out, df_总], axis=\"columns\")\n",
    "df_合并"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>智能化测绘的基本问题与发展方向  网络首发</td>\n",
       "      <td>陈军; 刘万增; 武昊; Songnian Li; 闫利</td>\n",
       "      <td>测绘学报</td>\n",
       "      <td>2021-07-06 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>国土空间开发适宜性评价的理论、方法与技术应用  网络首发</td>\n",
       "      <td>刘小波;王玉宽;李明</td>\n",
       "      <td>地球信息科学学报</td>\n",
       "      <td>2021-07-06 15:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发</td>\n",
       "      <td>李燕云;王永明;周奇;李亦学;王振</td>\n",
       "      <td>复旦学报(医学版)</td>\n",
       "      <td>2021-07-06 15:53</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>铁路盾构隧道智能建造技术现状与展望  网络首发</td>\n",
       "      <td>陈丹; 刘喆; 刘建友; 房倩; 海路</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-07-06 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发</td>\n",
       "      <td>郑翔; 山茂峰</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-06 15:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>845</th>\n",
       "      <td>795</td>\n",
       "      <td>846</td>\n",
       "      <td>基于并行化K-means的综合能源服务客户识别</td>\n",
       "      <td>沈子垚; 袁晓玲</td>\n",
       "      <td>电力工程技术</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>76.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>846</th>\n",
       "      <td>796</td>\n",
       "      <td>847</td>\n",
       "      <td>学科想象与理论生长——兼论计算教育学的错觉</td>\n",
       "      <td>吴刚</td>\n",
       "      <td>教育研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>2.0</td>\n",
       "      <td>315.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>847</th>\n",
       "      <td>797</td>\n",
       "      <td>848</td>\n",
       "      <td>我科学家研制成功新型可编程光量子计算芯片</td>\n",
       "      <td>NaN</td>\n",
       "      <td>机床与液压</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>848</th>\n",
       "      <td>798</td>\n",
       "      <td>849</td>\n",
       "      <td>高素质专业化审计队伍建设研究</td>\n",
       "      <td>上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>849</th>\n",
       "      <td>799</td>\n",
       "      <td>850</td>\n",
       "      <td>粤港澳大湾区大数据审计队伍建设研究</td>\n",
       "      <td>广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>198.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>850 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                                    篇名  \\\n",
       "0        0           1                 智能化测绘的基本问题与发展方向  网络首发   \n",
       "1        1           2          国土空间开发适宜性评价的理论、方法与技术应用  网络首发   \n",
       "2        2           3       基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发   \n",
       "3        3           4               铁路盾构隧道智能建造技术现状与展望  网络首发   \n",
       "4        4           5  互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发   \n",
       "..     ...         ...                                   ...   \n",
       "845    795         846               基于并行化K-means的综合能源服务客户识别   \n",
       "846    796         847                 学科想象与理论生长——兼论计算教育学的错觉   \n",
       "847    797         848                  我科学家研制成功新型可编程光量子计算芯片   \n",
       "848    798         849                        高素质专业化审计队伍建设研究   \n",
       "849    799         850                     粤港澳大湾区大数据审计队伍建设研究   \n",
       "\n",
       "                               作者               刊名              发表时间   被引  \\\n",
       "0    陈军; 刘万增; 武昊; Songnian Li; 闫利             测绘学报  2021-07-06 16:16  NaN   \n",
       "1                      刘小波;王玉宽;李明         地球信息科学学报  2021-07-06 15:54  NaN   \n",
       "2               李燕云;王永明;周奇;李亦学;王振        复旦学报(医学版)  2021-07-06 15:53  NaN   \n",
       "3             陈丹; 刘喆; 刘建友; 房倩; 海路        隧道建设(中英文)  2021-07-06 15:51  NaN   \n",
       "4                         郑翔; 山茂峰  北京交通大学学报(社会科学版)  2021-07-06 15:03  NaN   \n",
       "..                            ...              ...               ...  ...   \n",
       "845                      沈子垚; 袁晓玲           电力工程技术        2021-03-28  NaN   \n",
       "846                            吴刚             教育研究        2021-03-28  2.0   \n",
       "847                           NaN            机床与液压        2021-03-28  NaN   \n",
       "848  上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏             审计研究        2021-03-28  NaN   \n",
       "849      广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩             审计研究        2021-03-28  NaN   \n",
       "\n",
       "        下载  操作                                              详细页链接  \\\n",
       "0      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..     ...  ..                                                ...   \n",
       "845   76.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "846  315.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "847   54.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "848  220.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "849  198.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "845  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "846  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "847  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "848  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "849  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[850 rows x 11 columns]"
      ]
     },
     "execution_count": 46,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Stack the first-page rows on top of the merged rows.\n",
    "# pd.concat replaces DataFrame.append, which is deprecated since pandas 1.4 and removed in 2.0.\n",
    "# reset_index() is kept without drop=True so the previous row labels stay available as\n",
    "# the `index` column, i.e. the resulting table keeps the same columns as before.\n",
    "df_总表 = pd.concat([df_首页, df_合并]).reset_index()\n",
    "df_总表"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>智能化测绘的基本问题与发展方向  网络首发</td>\n",
       "      <td>陈军; 刘万增; 武昊; Songnian Li; 闫利</td>\n",
       "      <td>测绘学报</td>\n",
       "      <td>2021-07-06 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>国土空间开发适宜性评价的理论、方法与技术应用  网络首发</td>\n",
       "      <td>刘小波;王玉宽;李明</td>\n",
       "      <td>地球信息科学学报</td>\n",
       "      <td>2021-07-06 15:54</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发</td>\n",
       "      <td>李燕云;王永明;周奇;李亦学;王振</td>\n",
       "      <td>复旦学报(医学版)</td>\n",
       "      <td>2021-07-06 15:53</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>铁路盾构隧道智能建造技术现状与展望  网络首发</td>\n",
       "      <td>陈丹; 刘喆; 刘建友; 房倩; 海路</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-07-06 15:51</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发</td>\n",
       "      <td>郑翔; 山茂峰</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-07-06 15:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>845</th>\n",
       "      <td>795</td>\n",
       "      <td>846</td>\n",
       "      <td>基于并行化K-means的综合能源服务客户识别</td>\n",
       "      <td>沈子垚; 袁晓玲</td>\n",
       "      <td>电力工程技术</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>76.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>846</th>\n",
       "      <td>796</td>\n",
       "      <td>847</td>\n",
       "      <td>学科想象与理论生长——兼论计算教育学的错觉</td>\n",
       "      <td>吴刚</td>\n",
       "      <td>教育研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>2.0</td>\n",
       "      <td>315.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>847</th>\n",
       "      <td>797</td>\n",
       "      <td>848</td>\n",
       "      <td>我科学家研制成功新型可编程光量子计算芯片</td>\n",
       "      <td>NaN</td>\n",
       "      <td>机床与液压</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>848</th>\n",
       "      <td>798</td>\n",
       "      <td>849</td>\n",
       "      <td>高素质专业化审计队伍建设研究</td>\n",
       "      <td>上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>849</th>\n",
       "      <td>799</td>\n",
       "      <td>850</td>\n",
       "      <td>粤港澳大湾区大数据审计队伍建设研究</td>\n",
       "      <td>广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩</td>\n",
       "      <td>审计研究</td>\n",
       "      <td>2021-03-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>198.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>850 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                                    篇名  \\\n",
       "0        0           1                 智能化测绘的基本问题与发展方向  网络首发   \n",
       "1        1           2          国土空间开发适宜性评价的理论、方法与技术应用  网络首发   \n",
       "2        2           3       基于宫颈上皮与血管特征的阴道镜图像深度学习模型探索  网络首发   \n",
       "3        3           4               铁路盾构隧道智能建造技术现状与展望  网络首发   \n",
       "4        4           5  互联网平台经营者市场支配地位的认定——基于平台数据竞争的反思  网络首发   \n",
       "..     ...         ...                                   ...   \n",
       "845    795         846               基于并行化K-means的综合能源服务客户识别   \n",
       "846    796         847                 学科想象与理论生长——兼论计算教育学的错觉   \n",
       "847    797         848                  我科学家研制成功新型可编程光量子计算芯片   \n",
       "848    798         849                        高素质专业化审计队伍建设研究   \n",
       "849    799         850                     粤港澳大湾区大数据审计队伍建设研究   \n",
       "\n",
       "                               作者               刊名              发表时间   被引  \\\n",
       "0    陈军; 刘万增; 武昊; Songnian Li; 闫利             测绘学报  2021-07-06 16:16  NaN   \n",
       "1                      刘小波;王玉宽;李明         地球信息科学学报  2021-07-06 15:54  NaN   \n",
       "2               李燕云;王永明;周奇;李亦学;王振        复旦学报(医学版)  2021-07-06 15:53  NaN   \n",
       "3             陈丹; 刘喆; 刘建友; 房倩; 海路        隧道建设(中英文)  2021-07-06 15:51  NaN   \n",
       "4                         郑翔; 山茂峰  北京交通大学学报(社会科学版)  2021-07-06 15:03  NaN   \n",
       "..                            ...              ...               ...  ...   \n",
       "845                      沈子垚; 袁晓玲           电力工程技术        2021-03-28  NaN   \n",
       "846                            吴刚             教育研究        2021-03-28  2.0   \n",
       "847                           NaN            机床与液压        2021-03-28  NaN   \n",
       "848  上海市审计学会课题组; 钟琼; 王倩莹; 沈一铭; 冯敏             审计研究        2021-03-28  NaN   \n",
       "849      广东省审计学会课题组; 刘柱棠; 宗宇星; 谢珩             审计研究        2021-03-28  NaN   \n",
       "\n",
       "        下载  操作                                              详细页链接  \\\n",
       "0      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4      NaN  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..     ...  ..                                                ...   \n",
       "845   76.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "846  315.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "847   54.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "848  220.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "849  198.0  下载  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "845  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "846  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "847  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "848  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "849  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[850 rows x 11 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Save the combined table to a local Excel workbook, then show it.\n",
    "with pd.ExcelWriter('知网数据.xlsx', engine=\"openpyxl\", mode='w') as writer:\n",
    "    df_总表.to_excel(writer, sheet_name=\"知网\")\n",
    "display(df_总表)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 爬取refworks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the element with id `total`; per the original note this returns the\n",
    "# result list to its first page.\n",
    "element = driver.find_element_by_xpath('//*[@id=\"total\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "2"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "3"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "4"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "5"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "6"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "7"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "8"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "9"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Each result page lists 50 articles, so covering more than 800 articles takes at least\n",
    "# 17 pages. CNKI allows at most 500 selected items at a time, hence 10 pages in this batch.\n",
    "for i in range(10):\n",
    "    # Click the `selectCheckAll1` control to select the entries on the current page.\n",
    "    driver.find_element_by_xpath('//*[@id=\"selectCheckAll1\"]').click()\n",
    "    # Go to the next page and pause before touching the page again.\n",
    "    driver.find_element_by_id('PageNext').click()\n",
    "    time.sleep(5)\n",
    "    # Show the loop counter as a progress indicator.\n",
    "    display(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Locate the element to hover over: the link in the second item of `batchOpsBox`.\n",
    "from selenium.webdriver.common.action_chains import ActionChains\n",
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/a')\n",
    "# Move the mouse pointer onto the located element to perform the hover.\n",
    "ActionChains(driver).move_to_element(move).perform()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Hover the first entry of the submenu under the second `batchOpsBox` item, then\n",
    "# click the eighth entry of the list nested below it.\n",
    "# NOTE(review): presumably the eighth entry is the RefWorks export format - confirm on the live page.\n",
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/a')\n",
    "ActionChains(driver).move_to_element(move).perform()\n",
    "driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/ul/li[8]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-1B758225005A24641C60453EB64C9E1A',\n",
       " 'CDwindow-1733F1EB275C115FE0876C7CDA5C1CB6',\n",
       " 'CDwindow-342F9733D14C568963F4744A97DF6063']"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Inspect the handles of all browser windows currently open in this session.\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-53-889a0c377e4b>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "# Switch to the third window handle.\n",
    "# NOTE(review): presumably this is the export window opened by the previous click - confirm.\n",
    "# driver.switch_to.window replaces the deprecated driver.switch_to_window.\n",
    "driver.switch_to.window(driver.window_handles[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Export as RefWorks: click the link inside the element with id `litotxt`.\n",
    "element=driver.find_element_by_xpath('//*[@id=\"litotxt\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 后300篇"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-55-7f2dbf209d83>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# Return to the search-results window first (second window handle).\n",
    "# driver.switch_to.window replaces the deprecated driver.switch_to_window.\n",
    "driver.switch_to.window(driver.window_handles[1])\n",
    "# Clear the previous selection.\n",
    "element=driver.find_element_by_xpath('//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "2"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "3"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "4"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "5"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Repeat the select-then-next-page step six times for the second batch.\n",
    "for i in range(6):\n",
    "    # Click the `selectCheckAll1` control to select the entries on the current page.\n",
    "    driver.find_element_by_xpath('//*[@id=\"selectCheckAll1\"]').click()\n",
    "    # Go to the next page and pause before touching the page again.\n",
    "    driver.find_element_by_id('PageNext').click()\n",
    "    time.sleep(5)\n",
    "    # Show the loop counter as a progress indicator.\n",
    "    display(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Locate the element to hover over: the link in the second item of `batchOpsBox`.\n",
    "from selenium.webdriver.common.action_chains import ActionChains\n",
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/a')\n",
    "# Move the mouse pointer onto the located element to perform the hover.\n",
    "ActionChains(driver).move_to_element(move).perform()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 58,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Hover the first entry of the submenu under the second `batchOpsBox` item, then\n",
    "# click the eighth entry of the list nested below it.\n",
    "# NOTE(review): presumably the eighth entry is the RefWorks export format - confirm on the live page.\n",
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/a')\n",
    "ActionChains(driver).move_to_element(move).perform()\n",
    "driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/ul/li[8]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-59-0dfe2a1ada8f>:1: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "# Make the third browser window/tab (index 2 of window_handles) the active one.\n",
    "# driver.switch_to_window() is deprecated (and gone in Selenium 4); switch_to.window()\n",
    "# is the supported equivalent.\n",
    "driver.switch_to.window(driver.window_handles[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Export as RefWorks: click the link inside the element with id 'litotxt'.\n",
    "# find_element(by, value) replaces find_element_by_xpath, which Selenium 4.3 removed;\n",
    "# 'xpath' is the value of By.XPATH.\n",
    "element = driver.find_element('xpath', '//*[@id=\"litotxt\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 下载PDF文件"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-62-faaab47612fa>:20: DeprecationWarning: use options instead of chrome_options\n",
      "  driver = webdriver.Chrome(executable_path=r'C:\\Users\\FATJ\\AppData\\Local\\Google\\Chrome\\Application\\chrome.exe', chrome_options=options)\n"
     ]
    },
    {
     "ename": "WebDriverException",
     "evalue": "Message: Service C:\\Users\\FATJ\\AppData\\Local\\Google\\Chrome\\Application\\chrome.exe unexpectedly exited. Status code was: 0\n",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mWebDriverException\u001b[0m                        Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-62-faaab47612fa>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m     18\u001b[0m \u001b[0mprefs\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;33m{\u001b[0m\u001b[1;34m'profile.default_content_settings.popups'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[1;36m0\u001b[0m\u001b[1;33m,\u001b[0m \u001b[1;34m'download.default_directory'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mout_path\u001b[0m\u001b[1;33m}\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     19\u001b[0m \u001b[0moptions\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0madd_experimental_option\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'prefs'\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mprefs\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 20\u001b[1;33m \u001b[0mdriver\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mwebdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mChrome\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mexecutable_path\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34mr'C:\\Users\\FATJ\\AppData\\Local\\Google\\Chrome\\Application\\chrome.exe'\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mchrome_options\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0moptions\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     21\u001b[0m \u001b[1;31m#driver = webdriver.Chrome( chrome_options = opts) #desired_capabilities=caps\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\CloudMusic\\lib\\site-packages\\selenium\\webdriver\\chrome\\webdriver.py\u001b[0m in \u001b[0;36m__init__\u001b[1;34m(self, executable_path, port, options, service_args, desired_capabilities, service_log_path, chrome_options, keep_alive)\u001b[0m\n\u001b[0;32m     71\u001b[0m             \u001b[0mservice_args\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mservice_args\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     72\u001b[0m             log_path=service_log_path)\n\u001b[1;32m---> 73\u001b[1;33m         \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mservice\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mstart\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     74\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     75\u001b[0m         \u001b[1;32mtry\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\CloudMusic\\lib\\site-packages\\selenium\\webdriver\\common\\service.py\u001b[0m in \u001b[0;36mstart\u001b[1;34m(self)\u001b[0m\n\u001b[0;32m     96\u001b[0m         \u001b[0mcount\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;36m0\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m     97\u001b[0m         \u001b[1;32mwhile\u001b[0m \u001b[1;32mTrue\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m---> 98\u001b[1;33m             \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0massert_process_still_running\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m     99\u001b[0m             \u001b[1;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mis_connectable\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    100\u001b[0m                 \u001b[1;32mbreak\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32mC:\\CloudMusic\\lib\\site-packages\\selenium\\webdriver\\common\\service.py\u001b[0m in \u001b[0;36massert_process_still_running\u001b[1;34m(self)\u001b[0m\n\u001b[0;32m    107\u001b[0m         \u001b[0mreturn_code\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mprocess\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mpoll\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    108\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mreturn_code\u001b[0m \u001b[1;32mis\u001b[0m \u001b[1;32mnot\u001b[0m \u001b[1;32mNone\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 109\u001b[1;33m             raise WebDriverException(\n\u001b[0m\u001b[0;32m    110\u001b[0m                 \u001b[1;34m'Service %s unexpectedly exited. Status code was: %s'\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    111\u001b[0m                 \u001b[1;33m%\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mpath\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mreturn_code\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mWebDriverException\u001b[0m: Message: Service C:\\Users\\FATJ\\AppData\\Local\\Google\\Chrome\\Application\\chrome.exe unexpectedly exited. Status code was: 0\n"
     ]
    }
   ],
   "source": [
    "# Preparation: start a Chrome session whose downloads are saved into `out_path`.\n",
    "options = webdriver.ChromeOptions()\n",
    "out_path = r'C:\\Users\\FATJ\\Desktop\\web数据挖掘\\web期末\\pdf'  # directory the PDFs should be saved to\n",
    "prefs = {'profile.default_content_settings.popups': 0, 'download.default_directory': out_path}\n",
    "options.add_experimental_option('prefs', prefs)\n",
    "# chrome.exe is the browser, not chromedriver. Passing it as `executable_path` made\n",
    "# Selenium launch the browser as if it were the driver service, which failed with\n",
    "# 'Service ... chrome.exe unexpectedly exited'. The browser path belongs in\n",
    "# `binary_location`; chromedriver is then resolved the default way, exactly as in the\n",
    "# notebook's first driver cell.\n",
    "options.binary_location = r'C:\\Users\\FATJ\\AppData\\Local\\Google\\Chrome\\Application\\chrome.exe'\n",
    "# `options=` replaces the deprecated `chrome_options=` keyword.\n",
    "driver = webdriver.Chrome(options=options)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [],
   "source": [
    "def base64__api(uname, pwd, img, typeid):\n",
    "    \"\"\"Upload an image to the recognition endpoint at api.ttshitu.com and return its answer.\n",
    "\n",
    "    Args:\n",
    "        uname: Account user name, sent as the request's \"username\" field.\n",
    "        pwd: Account password, sent as the request's \"password\" field.\n",
    "        img: Path of the image file; it is read as bytes and sent base64-encoded.\n",
    "        typeid: Value sent unchanged as the request's \"typeid\" field.\n",
    "\n",
    "    Returns:\n",
    "        result[\"data\"][\"result\"] when the response's \"success\" field is truthy,\n",
    "        otherwise result[\"message\"]. Note that a failure is returned as text, not raised.\n",
    "    \"\"\"\n",
    "    with open(img, 'rb') as f:\n",
    "        b64 = base64.b64encode(f.read()).decode()\n",
    "    data = {\"username\": uname, \"password\": pwd, \"typeid\": typeid, \"image\": b64}\n",
    "    response = requests.post(\"http://api.ttshitu.com/predict\", json=data)\n",
    "    result = json.loads(response.text)\n",
    "    if result['success']:\n",
    "        return result[\"data\"][\"result\"]\n",
    "    return result[\"message\"]\n",
    "\n",
    "\n",
    "# The download cell calls this helper as `base64_api` (single underscore), so expose\n",
    "# that spelling too while keeping the original name.\n",
    "base64_api = base64__api"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "面向指挥保障的电磁大数据应用需求分析----已下载\n",
      "大数据时代高校图书馆智慧服务的逻辑与路径----已下载\n",
      "数据驱动型知识生产与数据权力场域----已下载\n",
      "数字防疫中个人信息利用和隐私让渡研究----已下载\n",
      "支持大数据的参数自适应支持向量回归方法  网络首发----已下载\n",
      "异构集群节点与作业特性感知资源分配算法  网络首发----已下载\n",
      "美国海洋科学技术两个“十年”计划比较分析及对我国的启示  网络首发----已下载\n",
      "基于大数据挖掘的电力变压器健康状态差异预警规则策略  网络首发----已下载\n",
      "人工智能深度介入消费金融：动因、风险及防控----已下载\n",
      "中国智慧城市建设的作用机制与路径探索----已下载\n",
      "数字经济的技术基础、价值本质与价值构成----已下载\n",
      "大数据时代下基于象思维的中医状态辨识----已下载\n",
      "长江科学院专家受邀参加第十一届防汛抗旱信息化论坛----已下载\n",
      "大数据时代国家治理中的文化生产与文化整合----已下载\n",
      "大数据时代政府治理的“档案参与”----已下载\n",
      "电网自动电压控制精细规则自动发现技术研究  网络首发----已下载\n",
      "再论智能煤矿建设路线：人工智能3.0视角  网络首发----已下载\n",
      "大数据环境下国家生物安全情报工作体系构建----已下载\n",
      "智慧城市教育公共服务数据治理研究----已下载\n",
      "可撤销属性加密结合快速密度聚类算法的非结构化大数据安全存储方法----已下载\n",
      "我国中小微企业信用评价研究现状与发展趋势----已下载\n",
      "多方计算在个人征信领域中的应用----已下载\n",
      "大数据时代的情报学发展脉络——《中国情报学前沿》评介  网络首发----已下载\n",
      "财务欺诈风险特征筛选框架的建立和应用  网络首发----已下载\n",
      "新时代提升网络意识形态治理效能的创新逻辑----已下载\n",
      "大数据时代信息共享与隐私保护的冲突与平衡----已下载\n",
      "大数据环境下基于谱机器学习的云物流资源配置----已下载\n",
      "大数据技术在水利工程管理中的应用——评《智慧水利大数据理论与方法》----已下载\n",
      "政府数据授权运营的实现机制与内在机理研究——以成都市为例----已下载\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "\n",
    "# Read the xlsx file saved locally earlier; its PDF download links are used below.\n",
    "data = pd.read_excel(\"知网数据.xlsx\")\n",
    "# First and one-past-last row index of the links to process in this run.\n",
    "count = 421\n",
    "end_count = 450\n",
    "# Titles and PDF links for the selected rows.\n",
    "title_list = data[\"篇名\"].to_list()[count:end_count]\n",
    "download_url_list = data[\"PDF下载链接\"].to_list()[count:end_count]\n",
    "\n",
    "# Credentials for the captcha-recognition service are read from the environment\n",
    "# (set TTSHITU_USERNAME / TTSHITU_PASSWORD) instead of being hard-coded in the notebook.\n",
    "captcha_user = os.environ[\"TTSHITU_USERNAME\"]\n",
    "captcha_password = os.environ[\"TTSHITU_PASSWORD\"]\n",
    "# The captcha screenshot is written to, and read back from, this one path.\n",
    "img_path = r\"C:\\Users\\FATJ\\Desktop\\web数据挖掘\\验证码.png\"\n",
    "\n",
    "for title, download_url in zip(title_list, download_url_list):\n",
    "    try:\n",
    "        # Open the PDF download link.\n",
    "        driver.get(download_url)\n",
    "        time.sleep(5)\n",
    "        # find_elements returns an empty list when there is no captcha image, so the\n",
    "        # normal case no longer depends on catching an exception. ('id' / 'xpath' are\n",
    "        # the values of By.ID / By.XPATH; the find_element_by_* helpers were removed\n",
    "        # in Selenium 4.3.)\n",
    "        if not driver.find_elements('id', 'vImg'):\n",
    "            # No captcha page was shown; reported as downloaded, as before.\n",
    "            print(f'{title}----已下载')\n",
    "            continue\n",
    "        # A captcha appeared: screenshot just the captcha image element.\n",
    "        time.sleep(5)\n",
    "        driver.find_element('id', 'vImg').screenshot(img_path)\n",
    "        # Recognise it through the helper defined in the previous cell (named `base64__api` there).\n",
    "        result = base64__api(uname=captcha_user, pwd=captcha_password, img=img_path, typeid=3)\n",
    "        # Show the recognised captcha text.\n",
    "        print(\"验证码识别：\", result)\n",
    "        # Type it into the captcha input.\n",
    "        driver.find_element('id', 'vcode').send_keys(result)\n",
    "        time.sleep(5)\n",
    "        # Submit the captcha form, after which the download starts.\n",
    "        driver.find_element('xpath', '/html/body/div/form/dl/dd/button').click()\n",
    "    except Exception as exc:\n",
    "        # Stay best-effort (carry on with the next paper) but report the real failure\n",
    "        # instead of claiming the file was downloaded.\n",
    "        print(f'{title}----下载失败: {exc!r}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
